Spaces:

noahzhy
/

KR_LPR

Running

App Files Files

KR_LPR / app.py

noahzhy

Refactor inference function and add preprocessing

5bfef7f about 1 year ago

raw

history blame

4.64 kB

	import os
	import glob
	from itertools import groupby

	import cv2
	import numpy as np
	import gradio as gr
	import tensorflow as tf


	def get_sample_images():
	list_ = glob.glob(os.path.join(os.path.dirname(__file__), 'samples/*.jpg'))
	# sort by name
	list_.sort(key=lambda x: int(x.split('/')[-1].split('.')[0]))
	return [[i] for i in list_]


	def cv2_imread(path):
	return cv2.imdecode(np.fromfile(path, dtype=np.uint8), cv2.IMREAD_UNCHANGED)


	def decode_label(mat, chars) -> str:
	# mat is the output of model
	# get char indices along best path
	best_path_indices = np.argmax(mat[0], axis=-1)
	# collapse best path (using itertools.groupby), map to chars, join char list to string
	best_chars_collapsed = [chars[k] for k, _ in groupby(best_path_indices) if k != len(chars)]
	res = ''.join(best_chars_collapsed)
	# remove space and '_'
	res = res.replace(' ', '').replace('_', '')
	return res


	def center_fit(img, w, h, inter=cv2.INTER_NEAREST, top_left=True):
	# get img shape
	img_h, img_w = img.shape[:2]
	# get ratio
	ratio = min(w / img_w, h / img_h)

	if len(img.shape) == 3:
	inter = cv2.INTER_AREA
	# resize img
	img = cv2.resize(img, (int(img_w * ratio), int(img_h * ratio)), interpolation=inter)
	# get new img shape
	img_h, img_w = img.shape[:2]
	# get start point
	start_w = (w - img_w) // 2
	start_h = (h - img_h) // 2

	if top_left:
	start_w = 0
	start_h = 0

	if len(img.shape) == 2:
	# create new img
	new_img = np.zeros((h, w), dtype=np.uint8)
	new_img[start_h:start_h+img_h, start_w:start_w+img_w] = img
	else:
	new_img = np.zeros((h, w, 3), dtype=np.uint8)
	new_img[start_h:start_h+img_h, start_w:start_w+img_w, :] = img

	return new_img


	def load_dict(dict_path='label.names'):
	with open(dict_path, 'r', encoding='utf-8') as f:
	dict = f.read().splitlines()
	dict = {i: dict[i] for i in range(len(dict))}
	return dict


	class TFliteDemo:
	def __init__(self, model_path, blank=85, conf_mode="mean"):
	self.blank = blank
	self.conf_mode = conf_mode
	self.interpreter = tf.lite.Interpreter(model_path=model_path)
	self.interpreter.allocate_tensors()
	self.input_details = self.interpreter.get_input_details()
	self.output_details = self.interpreter.get_output_details()

	def inference(self, x):
	self.interpreter.set_tensor(self.input_details[0]['index'], x)
	self.interpreter.invoke()
	return self.interpreter.get_tensor(self.output_details[0]['index'])

	def preprocess(self, img):
	if isinstance(img, str):
	image = cv2_imread(img)
	else:
	image = img
	image = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
	image = center_fit(image, 128, 64, top_left=True)
	image = np.reshape(image, (1, *image.shape, 1)).astype(np.uint8)
	return image

	def get_confidence(self, pred, mode="mean"):
	conf = []
	idxs = np.argmax(pred, axis=-1)
	values = np.max(pred, axis=-1)

	for idx, c in zip(idxs, values):
	if idx == self.blank: continue
	conf.append(c/255)

	if mode == "min":
	return np.min(conf)

	return np.mean(conf)

	def postprocess(self, pred):
	label = decode_label(pred, load_dict())
	conf = self.get_confidence(pred[0], mode=self.conf_mode)
	# keep 4 decimal places
	conf = float('{:.4f}'.format(conf))
	return label, conf


	def inference(img):
	# preprocess
	img = demo.preprocess(img)
	# inference
	pred = demo.inference(img)
	# postprocess
	label, conf = demo.postprocess(pred)
	return label, conf


	if __name__ == '__main__':
	_TITLE = '''South Korean License Plate Recognition'''
	_DESCRIPTION = '''
	<div>
	<p style="text-align: center; font-size: 1.3em">This is a demo of South Korean License Plate Recognition.
	<a style="display:inline-block; margin-left: .5em" href='https://github.com/noahzhy/KR_LPR_TF/'><img src='https://img.shields.io/github/stars/noahzhy/KR_LPR_TF?style=social' /></a>
	</p>
	</div>
	'''
	# init model
	demo = TFliteDemo(os.path.join(os.path.dirname(__file__), 'model.tflite'))
	interface = gr.Interface(
	fn=inference,
	inputs="image",
	outputs=[
	gr.Textbox(label="Plate Number", type="text"),
	gr.Textbox(label="Confidence", type="text"),
	],
	title=_TITLE,
	description=_DESCRIPTION,
	examples=get_sample_images(),
	)
	interface.launch()