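# Gradio demo: detects electrical receptacle symbols on construction drawings for
# takeoff automation, using a custom YOLOv5 model ("best.pt") with SAHI sliced inference.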
import torch
import gradio as gr
import cv2
import numpy as np
from sahi.utils.yolov5 import download_yolov5s6_model
# import required functions, classes
from sahi import AutoDetectionModel
from sahi.predict import get_sliced_prediction, visualize_object_predictions
# Autodetect GPU
if torch.cuda.is_available():
    device = torch.device("cuda")
else:
    device = torch.device("cpu")
# Load the model weights; the helper only downloads the default yolov5s6 weights
# if no file already exists at this path, so a local best.pt is left untouched
yolov5_model_path = "best.pt"
download_yolov5s6_model(destination_path=yolov5_model_path)
detection_model = AutoDetectionModel.from_pretrained(
    model_type="yolov5",
    model_path=yolov5_model_path,
    confidence_threshold=0.01,
    device=device,
)
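# The global confidence_threshold is kept low here; the effective per-class filtering
# happens later in do_detection(), driven by the UI sliders.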
def do_detection(image, hide_labels, confidence_scores):
    # `image` is the uploaded drawing as a numpy array (Gradio's default Image type)
    # Obtain detection results with SAHI sliced inference
    result = get_sliced_prediction(
        image,
        detection_model,
        slice_height=512,
        slice_width=512,
        overlap_height_ratio=0.12,
        overlap_width_ratio=0.12,
    )
    # Filter detections according to the per-class sliders and count how many
    # instances of each class survive, for the legend
    predictions = []
    class_counts = {}
    for prediction in result.object_prediction_list:
        category_name = prediction.category.name
        if prediction.score.value > confidence_scores[category_name]:
            predictions.append(prediction)
            class_counts[category_name] = class_counts.get(category_name, 0) + 1
    # Draw the boxes and labels on top of the image
    img_rgb = visualize_object_predictions(
        image,
        object_prediction_list=predictions,
        text_size=1,
        text_th=1,
        hide_labels=hide_labels,
        rect_th=3,
    )["image"]
    # Construct a legend listing the per-class counts
    legend_text = "Symbols Counted:"
    for class_name, count in class_counts.items():
        legend_text += f" {class_name}: {count} |"
    font = cv2.FONT_HERSHEY_SIMPLEX
    if hide_labels:
        font_scale = 1.5
    else:
        font_scale = 1
    font_color = (255, 255, 255)
    font_thickness = 2
    legend_bg_color = (131, 79, 0)
    legend_padding = 10
    legend_size, _ = cv2.getTextSize(legend_text, font, font_scale, font_thickness)
    legend_bg_height = legend_size[1] + 2 * legend_padding
    legend_bg_width = legend_size[0] + 2 * legend_padding
    legend_bg = np.zeros((legend_bg_height, legend_bg_width, 3), dtype=np.uint8)
    legend_bg[:] = legend_bg_color
    cv2.putText(
        legend_bg,
        legend_text,
        (legend_padding, legend_padding + legend_size[1]),
        font,
        font_scale,
        font_color,
        font_thickness,
    )
    # Overlay the legend in the bottom-right corner of the annotated image
    img_height, img_width, _ = img_rgb.shape
    legend_x = img_width - legend_bg_width
    legend_y = img_height - legend_bg_height
    img_rgb[legend_y:, legend_x:, :] = legend_bg
    return (
        img_rgb,
        result.to_coco_predictions(),
    )
def call_func(
    image,
    hide_labels,
    singleplex_value,
    duplex_value,
    triplex_value,
    quadruplex_value,
    gfci_value,
    gfci_wp_value,
):
    # Gather the individual slider values into the per-class threshold lookup
    # expected by do_detection()
    confidence_scores = {
        "Singleplex - Standard": singleplex_value,
        "Duplex - Standard": duplex_value,
        "Triplex - Standard": triplex_value,
        "Quadruplex - Standard": quadruplex_value,
        "Duplex - GFCI": gfci_value,
        "Duplex - Weatherproof-GFCI": gfci_wp_value,
    }
    return do_detection(image, hide_labels, confidence_scores)
theme = gr.themes.Soft()
with gr.Blocks(theme=theme) as demo:
    gr.Markdown(
        """
        <h1 align="center">Receptacle Detector for Takeoff Automation</h1>
        """
    )
    with gr.Row():
        input_image = gr.Image(
            label="Upload an image here.",
            source="upload",
            interactive=True,
        )
        examples = gr.Examples(
            examples=[
                ["test1.jpg"],
                ["test2.jpg"],
                ["test3.jpg"],
                ["test4.jpg"],
            ],
            inputs=[input_image],
            examples_per_page=4,
            label="Examples to use.",
        )
    hide_labels = gr.Checkbox(label="Hide labels")
    with gr.Accordion("Visualization Confidence Thresholds", open=False):
        singleplex_slider = gr.Slider(
            minimum=0.1,
            maximum=1,
            value=0.53,
            interactive=True,
            label="Singleplex",
        )
        duplex_slider = gr.Slider(
            minimum=0.1,
            maximum=1,
            value=0.66,
            interactive=True,
            label="Duplex",
        )
        triplex_slider = gr.Slider(
            minimum=0.1,
            maximum=1,
            value=0.65,
            interactive=True,
            label="Triplex",
        )
        quadruplex_slider = gr.Slider(
            minimum=0.1,
            maximum=1,
            value=0.63,
            interactive=True,
            label="Quadruplex",
        )
        gfci_slider = gr.Slider(
            minimum=0.1,
            maximum=1,
            value=0.31,
            interactive=True,
            label="GFCI",
        )
        gfci_wp_slider = gr.Slider(
            minimum=0.1,
            maximum=1,
            value=0.33,
            interactive=True,
            label="GFCI/WP",
        )
    results_button = gr.Button("Submit")
    results_button.click(
        call_func,
        inputs=[
            input_image,
            hide_labels,
            singleplex_slider,
            duplex_slider,
            triplex_slider,
            quadruplex_slider,
            gfci_slider,
            gfci_wp_slider,
        ],
        outputs=[
            gr.Image(type="numpy", label="Output Image"),
            gr.Json(),
        ],
    )
demo.launch()
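# Note: gr.Image(source="upload") and gr.Json follow the Gradio 3.x API; newer Gradio
# releases changed these component arguments, so pin the gradio version accordingly.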