# keypoint-demo / app.py
import gradio as gr
import cv2
import numpy as np
import onnxruntime as ort
import copy

# Path to the ONNX model and the input size it expects.
MODEL_PATH = "./model_keypoints_v3.onnx"
IMG_SIZE = (224, 224)

# Maximum representable value per dtype, used to normalize images to [0, 1].
MAX_VALUES_BY_DTYPE = {
    np.dtype("uint8"): 255,
    np.dtype("uint16"): 65535,
    np.dtype("uint32"): 4294967295,
    np.dtype("float32"): 1.0,
}

def to_float(img, max_value=None):
    """Convert an image to float32 in the [0, 1] range."""
    if max_value is None:
        try:
            max_value = MAX_VALUES_BY_DTYPE[img.dtype]
        except KeyError:
            raise RuntimeError(
                "Can't infer the maximum value for dtype {}. Specify it explicitly "
                "via the max_value argument.".format(img.dtype)
            )
    return img.astype("float32") / max_value
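
# Illustrative check (doctest-style): a uint8 image scales to [0, 1].
# >>> to_float(np.array([[0, 255]], dtype=np.uint8))
# array([[0., 1.]], dtype=float32)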

def preprocessor(img):
    # Resize to the network input size and convert OpenCV's BGR to RGB.
    original_img = cv2.resize(img, IMG_SIZE)
    original_img = cv2.cvtColor(original_img, cv2.COLOR_BGR2RGB)
    # Normalize to [0, 1], move channels first (HWC -> CHW) and add a batch axis.
    preprocessed = to_float(original_img)
    preprocessed = np.moveaxis(preprocessed, -1, 0)
    preprocessed = np.expand_dims(preprocessed, axis=0)
    preprocessed = np.asarray(preprocessed, dtype=np.float32)
    return preprocessed, original_img
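
# Illustrative check: a 640x480 BGR frame becomes a (1, 3, 224, 224) float32
# batch plus the 224x224 RGB preview used for drawing:
#   batch, preview = preprocessor(np.zeros((480, 640, 3), dtype=np.uint8))
#   assert batch.shape == (1, 3, 224, 224) and preview.shape == (224, 224, 3)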

def nms(bounding_boxes, confidence_score, threshold):
    """Greedy non-maximum suppression: keep the highest-scoring boxes and
    discard any box whose IoU with a kept box exceeds the threshold."""
    # If there are no bounding boxes, return empty results.
    if len(bounding_boxes) == 0:
        return [], [], []
    boxes = np.array(bounding_boxes)
    # Corner coordinates of the bounding boxes.
    start_x = boxes[:, 0]
    start_y = boxes[:, 1]
    end_x = boxes[:, 2]
    end_y = boxes[:, 3]
    # Confidence scores of the bounding boxes.
    score = np.array(confidence_score)
    # Boxes kept after suppression.
    picked_boxes = []
    picked_score = []
    picked_boxes_idx = []
    # Areas of the bounding boxes.
    areas = (end_x - start_x + 1) * (end_y - start_y + 1)
    # Indices sorted by ascending confidence score.
    order = np.argsort(score)
    while order.size > 0:
        # Pick the box with the largest remaining confidence score.
        index = order[-1]
        picked_boxes.append(bounding_boxes[index])
        picked_boxes_idx.append(index)
        picked_score.append(confidence_score[index])
        # Coordinates of the intersection with the remaining boxes.
        x1 = np.maximum(start_x[index], start_x[order[:-1]])
        x2 = np.minimum(end_x[index], end_x[order[:-1]])
        y1 = np.maximum(start_y[index], start_y[order[:-1]])
        y2 = np.minimum(end_y[index], end_y[order[:-1]])
        # Intersection area.
        w = np.maximum(0.0, x2 - x1 + 1)
        h = np.maximum(0.0, y2 - y1 + 1)
        intersection = w * h
        # Intersection over union (IoU) with the picked box.
        ratio = intersection / (areas[index] + areas[order[:-1]] - intersection)
        # Keep only the boxes whose overlap is below the threshold.
        left = np.where(ratio < threshold)
        order = order[left]
    return picked_boxes_idx, picked_boxes, picked_score
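
# Illustrative check: with two heavily overlapping boxes and one disjoint box,
# NMS keeps the higher-scoring overlap plus the disjoint box, e.g.
#   nms([[0, 0, 10, 10], [1, 1, 10, 10], [50, 50, 60, 60]], [0.9, 0.8, 0.7], 0.3)
# picks indices [0, 2] with their boxes and scores [0.9, 0.7].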

def postprocessor(prediction, orig_img):
    boxes = prediction[0]
    scores = prediction[1]
    keypoints = prediction[2]
    # Keep confident detections (score > 0.7), then apply NMS to drop duplicates.
    high_scores_idxs = np.where(scores > 0.7)[0].tolist()
    post_nms_idxs, best_boxes, best_scores = nms(boxes[high_scores_idxs], scores[high_scores_idxs], 0.3)
    keypoints_picked = keypoints[high_scores_idxs]
    keypoints = []
    for kps in keypoints_picked[post_nms_idxs]:
        keypoints.append([list(map(int, kp[:2])) for kp in kps])
    img_copy = copy.deepcopy(orig_img)
    # Fall back to the unannotated image and a zero distance if nothing is detected.
    result_image = img_copy
    distance = 0
    text = ["A", "B"]
    points = list()
    # Draw each detection box.
    for bbox in best_boxes:
        start_point = (int(bbox[0]), int(bbox[1]))
        end_point = (int(bbox[2]), int(bbox[3]))
        color = (0, 255, 0)
        thickness = 1
        result_image = cv2.rectangle(img_copy, start_point, end_point, color, thickness)
    # Draw and label the keypoints ("A" and "B") of each detection.
    for ab in keypoints:
        for idx, point in enumerate(ab):
            x = int(point[0])
            y = int(point[1])
            points.append((x, y))
            color = (255, 0, 0)
            thickness = 3
            result_image = cv2.circle(result_image, (x, y), radius=0, color=color, thickness=thickness)
            result_image = cv2.putText(result_image, text[idx], (x + 2, y - 5), cv2.FONT_HERSHEY_SIMPLEX, 0.35, (255, 0, 0), 1, cv2.LINE_AA)
    # Join the first two keypoints and measure their distance in pixels.
    if len(points) >= 2:
        distance = distanceCalculate(points[0], points[1])
        midpoints = midpoint(points[0], points[1])
        result_image = cv2.line(result_image, points[0], points[1], (0, 0, 255), 1)
        # Optionally annotate the distance near the midpoint of the line:
        # result_image = cv2.putText(result_image, str(distance), (midpoints[0], midpoints[1] + 10), cv2.FONT_HERSHEY_SIMPLEX, 0.40, (0, 0, 255), 1, cv2.LINE_AA)
    return result_image, distance

def distanceCalculate(p1, p2):
    """Euclidean distance between p1 and p2, given as (x, y) tuples."""
    dis = round(((p2[0] - p1[0]) ** 2 + (p2[1] - p1[1]) ** 2) ** 0.5, 2)
    return dis
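
# Example: distanceCalculate((0, 0), (3, 4)) == 5.0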

# Midpoint of the segment joining two points.
def midpoint(p1, p2):
    mid_x = (p1[0] + p2[0]) // 2
    mid_y = (p1[1] + p2[1]) // 2
    midpoints = (mid_x, mid_y)
    return midpoints
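
# Example: midpoint((0, 0), (4, 6)) == (2, 3)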

def infer(preprocessed):
    # Prefer the CUDA provider, with CPU listed as a fallback.
    ort_sess = ort.InferenceSession(MODEL_PATH, providers=["CUDAExecutionProvider", "CPUExecutionProvider"])
    input_name = ort_sess.get_inputs()[0].name
    # For this model, output indices 0, 2 and 3 hold the boxes, scores and keypoints.
    boxes = ort_sess.get_outputs()[0].name
    scores = ort_sess.get_outputs()[2].name
    keypoints = ort_sess.get_outputs()[3].name
    prediction = ort_sess.run([boxes, scores, keypoints], {input_name: preprocessed})
    return prediction
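
# Building the session once at import time would avoid reloading the model on
# every request; a minimal sketch (the _SESSION name and infer_cached helper
# are illustrative, not part of the original app):
#
#   _SESSION = ort.InferenceSession(MODEL_PATH, providers=["CPUExecutionProvider"])
#
#   def infer_cached(preprocessed):
#       input_name = _SESSION.get_inputs()[0].name
#       outputs = [_SESSION.get_outputs()[i].name for i in (0, 2, 3)]
#       return _SESSION.run(outputs, {input_name: preprocessed})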

def predict(img):
    raw_img = cv2.imread(img)
    # Preprocess, run the model, then draw boxes, keypoints and the measured distance.
    preprocessed_img, orig_img = preprocessor(raw_img)
    prediction = infer(preprocessed_img)
    keypoints_map, distance_keypoints = postprocessor(prediction, orig_img)
    # A leg spacing above 96 pixels is considered within tolerance.
    if distance_keypoints > 96:
        display_text = f"Transistor detected\nThe distance between the two legs is {distance_keypoints}\nThis dimension is conforming and within tolerance"
    else:
        display_text = f"Transistor detected\nThe distance between the two legs is {distance_keypoints}\nThis dimension is not conforming and is out of tolerance"
    return keypoints_map, display_text

sample_images = [["006.png"], ["002.png"], ["003.png"], ["004.png"], ["058.png"],
                 ["001.png"], ["011.png"], ["012.png"], ["013.png"], ["014.png"]]

gr.Interface(fn=predict,
             inputs=[gr.Image(label="Image to test", type="filepath")],
             outputs=[gr.Image(label="Result"), gr.Textbox(label="Analysis")],
             examples=sample_images).launch(share=False)