Spaces:

ozgurkara
/

RAVE

Running on A10G

App Files Files Community

RAVE / utils /preprocesser_utils.py

ozgurkara

first commit

eb9a9b4 10 months ago

raw

history blame

No virus

6.45 kB

	import cv2
	import yaml

	import numpy as np
	from annotator.lineart import LineartDetector
	from annotator.zoe import ZoeDetector
	from annotator.manga_line import MangaLineExtration
	from annotator.lineart_anime import LineartAnimeDetector
	from annotator.hed import apply_hed
	from annotator.canny import apply_canny
	from annotator.pidinet import apply_pidinet
	from annotator.leres import apply_leres
	from annotator.midas import apply_midas


	def yaml_load(path):
	    """Read the YAML file at ``path`` and return its parsed content.

	    Parsing uses ``yaml.safe_load``. If the document is malformed, the
	    ``yaml.YAMLError`` is printed and ``None`` is returned instead of
	    propagating the error.
	    """
	    with open(path, 'r') as handle:
	        try:
	            parsed = yaml.safe_load(handle)
	        except yaml.YAMLError as err:
	            # Best-effort: report the problem and fall through to None.
	            print(err)
	            return None
	        return parsed

	def yaml_dump(path, data):
	    """Serialize ``data`` as block-style YAML into the file at ``path``.

	    The file is opened in write mode, so existing content is replaced.
	    """
	    with open(path, 'w') as sink:
	        yaml.dump(data, stream=sink, default_flow_style=False)

	def pad64(x):
	    """Return how much must be added to ``x`` to reach the next multiple of 64.

	    The result is 0 when ``x`` is already a multiple of 64.
	    """
	    blocks_needed = np.ceil(float(x) / 64.0)
	    padded_length = blocks_needed * 64
	    return int(padded_length - x)

	def HWC3(x):
	    """Convert a uint8 image to a 3-channel height x width x channel array.

	    Accepted inputs are 2-D arrays and 3-D arrays with 1, 3 or 4 channels:

	    * 3 channels: the input array itself is returned (no copy).
	    * 1 channel (or 2-D): the single channel is replicated three times.
	    * 4 channels: the first three channels are alpha-blended over a white
	      (255) background using the fourth channel as alpha.

	    Any other dtype, rank or channel count trips an assertion.
	    """
	    assert x.dtype == np.uint8
	    if x.ndim == 2:
	        # Promote a plain 2-D image to H x W x 1 so the logic below applies.
	        x = x[:, :, None]
	    assert x.ndim == 3
	    channels = x.shape[2]
	    assert channels in (1, 3, 4)
	    if channels == 1:
	        return np.repeat(x, 3, axis=2)
	    if channels == 4:
	        rgb = x[:, :, 0:3].astype(np.float32)
	        opacity = x[:, :, 3:4].astype(np.float32) / 255.0
	        # Composite over white: fully transparent pixels become 255.
	        blended = rgb * opacity + 255.0 * (1.0 - opacity)
	        return blended.clip(0, 255).astype(np.uint8)
	    # Exactly three channels: nothing to do.
	    return x

	def safer_memory(x):
	    """Return a freshly allocated, C-contiguous copy of the array ``x``.

	    The result never shares memory with the input.
	    """
	    # Fix many MAC/AMD problems
	    detached = x.copy()
	    contiguous = np.ascontiguousarray(detached)
	    return contiguous.copy()


	def resize_image_with_pad(input_image, resolution, skip_hwc3=False):
	    """Resize an image so its shorter side equals ``resolution``, then pad.

	    The image is first normalised with ``HWC3`` unless ``skip_hwc3`` is
	    true. It is scaled uniformly (cubic interpolation when enlarging, area
	    interpolation otherwise) and then padded on the bottom and right, by
	    repeating edge pixels, so both sides become multiples of 64.

	    Returns a tuple ``(padded_image, remove_pad)`` where ``remove_pad`` is a
	    callable that crops an array back to the resized, unpadded height and
	    width.
	    """
	    img = input_image if skip_hwc3 else HWC3(input_image)
	    H_raw, W_raw, _ = img.shape

	    # Scale factor that maps the shorter side onto the requested resolution.
	    scale = float(resolution) / float(min(H_raw, W_raw))
	    if scale > 1:
	        interpolation = cv2.INTER_CUBIC
	    else:
	        interpolation = cv2.INTER_AREA

	    H_target = int(np.round(float(H_raw) * scale))
	    W_target = int(np.round(float(W_raw) * scale))
	    # cv2.resize takes the target size as (width, height).
	    resized = cv2.resize(img, (W_target, H_target), interpolation=interpolation)

	    H_pad = pad64(H_target)
	    W_pad = pad64(W_target)
	    pad_widths = [[0, H_pad], [0, W_pad], [0, 0]]
	    img_padded = np.pad(resized, pad_widths, mode='edge')

	    def remove_pad(x):
	        # Crop back to the resized (pre-padding) height and width.
	        return safer_memory(x[:H_target, :W_target])

	    return safer_memory(img_padded), remove_pad



	def lineart_standard(img, res=512, **kwargs):
	    """Produce a line-art map without a neural model.

	    The image is resized/padded via ``resize_image_with_pad``, compared
	    against a Gaussian-blurred copy of itself (sigma 6.0), and the
	    per-pixel minimum over channels of ``blurred - original`` is
	    normalised and scaled into a uint8 map.

	    Extra keyword arguments are accepted and ignored. Returns
	    ``(detected_map, True)`` with the padding removed from the map.
	    """
	    padded, remove_pad = resize_image_with_pad(img, res)
	    pixels = padded.astype(np.float32)
	    blurred = cv2.GaussianBlur(pixels, (0, 0), 6.0)
	    # Keep only where the blur is brighter than the source in every channel.
	    strength = np.clip((blurred - pixels).min(axis=2), 0, 255)
	    # Normalise by the median of the pixels above 8, but never by less than 16.
	    strong_pixels = strength[strength > 8]
	    strength /= max(16, np.median(strong_pixels))
	    strength *= 127
	    line_map = strength.clip(0, 255).astype(np.uint8)
	    return remove_pad(line_map), True


	def lineart(img, res=512, **kwargs):
	    """Run ``LineartDetector('sk_model.pth')`` on the resized, padded image.

	    A new detector is constructed on every call. Extra keyword arguments
	    are accepted and ignored. Returns ``(detected_map, True)`` with the
	    padding removed from the map.
	    """
	    padded, remove_pad = resize_image_with_pad(img, res)
	    detector = LineartDetector('sk_model.pth')
	    # applied auto inversion: the detector output is flipped as 255 - value
	    inverted = 255 - detector(padded)
	    return remove_pad(inverted), True


	def lineart_coarse(img, res=512, **kwargs):
	    """Run ``LineartDetector('sk_model2.pth')`` on the resized, padded image.

	    A new detector is constructed on every call. Extra keyword arguments
	    are accepted and ignored. Returns ``(detected_map, True)`` with the
	    padding removed from the map.
	    """
	    padded, remove_pad = resize_image_with_pad(img, res)
	    detector = LineartDetector('sk_model2.pth')
	    # applied auto inversion: the detector output is flipped as 255 - value
	    inverted = 255 - detector(padded)
	    return remove_pad(inverted), True

	def lineart_anime(img, res=512, **kwargs):
	    """Run ``LineartAnimeDetector`` on the resized, padded image.

	    A new detector is constructed on every call. Extra keyword arguments
	    are accepted and ignored. Returns ``(detected_map, True)`` with the
	    padding removed from the map.
	    """
	    padded, remove_pad = resize_image_with_pad(img, res)
	    detector = LineartAnimeDetector()
	    # applied auto inversion: the detector output is flipped as 255 - value
	    inverted = 255 - detector(padded)
	    return remove_pad(inverted), True


	def lineart_anime_denoise(img, res=512, **kwargs):
	    """Run ``MangaLineExtration`` on the resized, padded image.

	    A new extractor is constructed on every call. Extra keyword arguments
	    are accepted and ignored. Returns ``(detected_map, True)`` with the
	    padding removed from the map.
	    """
	    padded, remove_pad = resize_image_with_pad(img, res)
	    extractor = MangaLineExtration()
	    # applied auto inversion
	    # NOTE(review): unlike the other lineart wrappers, no `255 - ...` is
	    # done here; presumably the extractor already returns an inverted
	    # map -- confirm against annotator.manga_line.
	    line_map = extractor(padded)
	    return remove_pad(line_map), True


	def canny(img, res=512, thr_a=100, thr_b=200, **kwargs):
	    """Run ``apply_canny`` on the resized, padded image.

	    ``thr_a`` and ``thr_b`` are forwarded, in that order, as the two
	    positional threshold arguments of ``apply_canny``. Extra keyword
	    arguments are accepted and ignored. Returns ``(detected_map, True)``
	    with the padding removed from the map.
	    """
	    padded, remove_pad = resize_image_with_pad(img, res)
	    edges = apply_canny(padded, thr_a, thr_b)
	    return remove_pad(edges), True



	def hed(img, res=512, **kwargs):
	    """Run ``apply_hed`` with its default options on the resized, padded image.

	    Extra keyword arguments are accepted and ignored. Returns
	    ``(detected_map, True)`` with the padding removed from the map.
	    """
	    padded, remove_pad = resize_image_with_pad(img, res)
	    edges = apply_hed(padded)
	    return remove_pad(edges), True


	def hed_safe(img, res=512, **kwargs):
	    """Run ``apply_hed`` with ``is_safe=True`` on the resized, padded image.

	    Extra keyword arguments are accepted and ignored. Returns
	    ``(detected_map, True)`` with the padding removed from the map.
	    """
	    padded, remove_pad = resize_image_with_pad(img, res)
	    edges = apply_hed(padded, is_safe=True)
	    return remove_pad(edges), True

	def midas(img, res=512, a=np.pi * 2.0, **kwargs):
	    """Run ``apply_midas`` on the resized, padded image.

	    ``a`` is forwarded as the second positional argument of
	    ``apply_midas``. That call returns a pair; only its first element is
	    kept. Extra keyword arguments are accepted and ignored. Returns
	    ``(detected_map, True)`` with the padding removed from the map.
	    """
	    padded, remove_pad = resize_image_with_pad(img, res)
	    depth_map, _unused = apply_midas(padded, a)
	    return remove_pad(depth_map), True


	def leres(img, res=512, thr_a=0, thr_b=0, boost=False, **kwargs):
	    """Run ``apply_leres`` on the resized, padded image (``boost`` off by default).

	    ``thr_a`` and ``thr_b`` are forwarded positionally and ``boost`` as a
	    keyword. Extra keyword arguments are accepted and ignored. Returns
	    ``(detected_map, True)`` with the padding removed from the map.
	    """
	    padded, remove_pad = resize_image_with_pad(img, res)
	    depth_map = apply_leres(padded, thr_a, thr_b, boost=boost)
	    return remove_pad(depth_map), True

	def lerespp(img, res=512, thr_a=0, thr_b=0, boost=True, **kwargs):
	    """Run ``apply_leres`` on the resized, padded image (``boost`` on by default).

	    ``thr_a`` and ``thr_b`` are forwarded positionally and ``boost`` as a
	    keyword. Extra keyword arguments are accepted and ignored. Returns
	    ``(detected_map, True)`` with the padding removed from the map.
	    """
	    padded, remove_pad = resize_image_with_pad(img, res)
	    depth_map = apply_leres(padded, thr_a, thr_b, boost=boost)
	    return remove_pad(depth_map), True


	def pidinet(img, res=512, **kwargs):
	    """Run ``apply_pidinet`` with its default options on the resized, padded image.

	    Extra keyword arguments are accepted and ignored. Returns
	    ``(detected_map, True)`` with the padding removed from the map.
	    """
	    padded, remove_pad = resize_image_with_pad(img, res)
	    edges = apply_pidinet(padded)
	    return remove_pad(edges), True


	def pidinet_ts(img, res=512, **kwargs):
	    """Run ``apply_pidinet`` with ``apply_fliter=True`` on the resized, padded image.

	    Extra keyword arguments are accepted and ignored. Returns
	    ``(detected_map, True)`` with the padding removed from the map.
	    """
	    padded, remove_pad = resize_image_with_pad(img, res)
	    # `apply_fliter` (sic) is the keyword name as passed to apply_pidinet.
	    edges = apply_pidinet(padded, apply_fliter=True)
	    return remove_pad(edges), True


	def pidinet_safe(img, res=512, **kwargs):
	    """Run ``apply_pidinet`` with ``is_safe=True`` on the resized, padded image.

	    Extra keyword arguments are accepted and ignored. Returns
	    ``(detected_map, True)`` with the padding removed from the map.
	    """
	    padded, remove_pad = resize_image_with_pad(img, res)
	    edges = apply_pidinet(padded, is_safe=True)
	    return remove_pad(edges), True



	def zoe_depth(img, res=512, **kwargs):
	    """Run ``ZoeDetector`` on the resized, padded image.

	    A new detector is constructed on every call. Extra keyword arguments
	    are accepted and ignored. Returns ``(detected_map, True)`` with the
	    padding removed from the map.
	    """
	    padded, remove_pad = resize_image_with_pad(img, res)
	    detector = ZoeDetector()
	    depth_map = detector(padded)
	    return remove_pad(depth_map), True


	# Registry mapping a preprocessor name to the function that implements it.
	# Every registered function is called as ``fn(img, res=...)`` and returns a
	# ``(detected_map, flag)`` tuple.
	preprocessors_dict = {
	# Line-art extractors.
	'lineart_realistic': lineart,
	'lineart_coarse': lineart_coarse,
	'lineart_standard': lineart_standard,
	'lineart_anime': lineart_anime,
	'lineart_anime_denoise': lineart_anime_denoise,
	# Soft-edge detectors (HED and PiDiNet, default and "safe" variants).
	'softedge_hed': hed,
	'softedge_hedsafe': hed_safe,
	'softedge_pidinet': pidinet,
	'softedge_pidsafe': pidinet_safe,
	# Canny edge detector.
	'canny': canny,
	# Depth estimators.
	'depth_leres': leres,
	'depth_leres++': lerespp,
	'depth_midas': midas,
	'depth_zoe': zoe_depth,
	}

	def pixel_perfect_process(input_image, p_name):
	    """Run the preprocessor named ``p_name`` at the image's native resolution.

	    Args:
	        input_image: Image array whose first two dimensions are height and
	            width.
	        p_name: Key into ``preprocessors_dict`` selecting the preprocessor.

	    Returns:
	        The detected map produced by the selected preprocessor; the second
	        element of the preprocessor's return tuple is discarded.

	    Raises:
	        KeyError: If ``p_name`` is not a key of ``preprocessors_dict``.
	    """
	    # Only height and width are needed; slicing also accepts 2-D images.
	    raw_H, raw_W = input_image.shape[:2]
	    # resize_image_with_pad scales the *shorter* side to `res`, so the
	    # shorter side must be passed to keep the scale factor at 1. Passing
	    # the height unconditionally would upscale portrait (H > W) images.
	    preprocessor_resolution = min(raw_H, raw_W)
	    detected_map, _ = preprocessors_dict[p_name](input_image, res=preprocessor_resolution)
	    return detected_map