Spaces:

palondomus
/

CaesarAI

Sleeping

CaesarAI / CaesarObjectDetection /utils.py

CaesarCloudSync

CaesarAI Deployed

9d3162f almost 2 years ago

9.97 kB

	import time
	import torch
	import numpy as np
	import matplotlib.pyplot as plt
	import matplotlib.patches as patches


	def boxes_iou(box1, box2):
	"""
	Returns the IOU between `box1` and `box2` (i.e intersection area divided by union area)
	"""
	# Get the Width and Height of each bounding box
	width_box1 = box1[2]
	height_box1 = box1[3]
	width_box2 = box2[2]
	height_box2 = box2[3]

	# Calculate the area of the each bounding box
	area_box1 = width_box1 * height_box1
	area_box2 = width_box2 * height_box2

	# Find the vertical edges of the union of the two bounding boxes
	mx = min(box1[0] - width_box1/2.0, box2[0] - width_box2/2.0)
	Mx = max(box1[0] + width_box1/2.0, box2[0] + width_box2/2.0)

	# Calculate the width of the union of the two bounding boxes
	union_width = Mx - mx

	# Find the horizontal edges of the union of the two bounding boxes
	my = min(box1[1] - height_box1/2.0, box2[1] - height_box2/2.0)
	My = max(box1[1] + height_box1/2.0, box2[1] + height_box2/2.0)

	# Calculate the height of the union of the two bounding boxes
	union_height = My - my

	# Calculate the width and height of the area of intersection of the two bounding boxes
	intersection_width = width_box1 + width_box2 - union_width
	intersection_height = height_box1 + height_box2 - union_height

	# If the the boxes don't overlap then their IOU is zero
	if intersection_width <= 0 or intersection_height <= 0:
	return 0.0

	# Calculate the area of intersection of the two bounding boxes
	intersection_area = intersection_width * intersection_height

	# Calculate the area of the union of the two bounding boxes
	union_area = area_box1 + area_box2 - intersection_area

	# Calculate the IOU
	iou = intersection_area/union_area

	return iou


	def nms(boxes, iou_thresh):
	"""
	Performs Non maximal suppression technique to `boxes` using `iou_thresh` threshold
	"""
	# print(boxes.shape)
	# If there are no bounding boxes do nothing
	if len(boxes) == 0:
	return boxes

	# Create a PyTorch Tensor to keep track of the detection confidence
	# of each predicted bounding box
	det_confs = torch.zeros(len(boxes))

	# Get the detection confidence of each predicted bounding box
	for i in range(len(boxes)):
	det_confs[i] = boxes[i][4]

	# Sort the indices of the bounding boxes by detection confidence value in descending order.
	# We ignore the first returned element since we are only interested in the sorted indices
	_,sortIds = torch.sort(det_confs, descending = True)

	# Create an empty list to hold the best bounding boxes after
	# Non-Maximal Suppression (NMS) is performed
	best_boxes = []

	# Perform Non-Maximal Suppression
	for i in range(len(boxes)):

	# Get the bounding box with the highest detection confidence first
	box_i = boxes[sortIds[i]]

	# Check that the detection confidence is not zero
	if box_i[4] > 0:

	# Save the bounding box
	best_boxes.append(box_i)

	# Go through the rest of the bounding boxes in the list and calculate their IOU with
	# respect to the previous selected box_i.
	for j in range(i + 1, len(boxes)):
	box_j = boxes[sortIds[j]]

	# If the IOU of box_i and box_j is higher than the given IOU threshold set
	# box_j's detection confidence to zero.
	if boxes_iou(box_i, box_j) > iou_thresh:
	box_j[4] = 0

	return best_boxes


	def detect_objects(model, img, iou_thresh, nms_thresh):

	# Start the time. This is done to calculate how long the detection takes.
	start = time.time()

	# Set the model to evaluation mode.
	model.eval()

	# Convert the image from a NumPy ndarray to a PyTorch Tensor of the correct shape.
	# The image is transposed, then converted to a FloatTensor of dtype float32, then
	# Normalized to values between 0 and 1, and finally unsqueezed to have the correct
	# shape of 1 x 3 x 416 x 416
	img = torch.from_numpy(img.transpose(2,0,1)).float().div(255.0).unsqueeze(0)

	# Feed the image to the neural network with the corresponding NMS threshold.
	# The first step in NMS is to remove all bounding boxes that have a very low
	# probability of detection. All predicted bounding boxes with a value less than
	# the given NMS threshold will be removed.
	list_boxes = model(img, nms_thresh)

	# Make a new list with all the bounding boxes returned by the neural network
	boxes = list_boxes[0][0] + list_boxes[1][0] + list_boxes[2][0]

	# Perform the second step of NMS on the bounding boxes returned by the neural network.
	# In this step, we only keep the best bounding boxes by eliminating all the bounding boxes
	# whose IOU value is higher than the given IOU threshold
	boxes = nms(boxes, iou_thresh)

	# Stop the time.
	finish = time.time()

	# Print the time it took to detect objects
	print('\n\nIt took {:.3f}'.format(finish - start), 'seconds to detect the objects in the image.\n')

	# Print the number of objects detected
	print('Number of Objects Detected:', len(boxes), '\n')

	return boxes


	def load_class_names(namesfile):

	# Create an empty list to hold the object classes
	class_names = []

	# Open the file containing the COCO object classes in read-only mode
	with open(namesfile, 'r') as fp:

	# The coco.names file contains only one object class per line.
	# Read the file line by line and save all the lines in a list.
	lines = fp.readlines()

	# Get the object class names
	for line in lines:

	# Make a copy of each line with any trailing whitespace removed
	line = line.rstrip()

	# Save the object class name into class_names
	class_names.append(line)

	return class_names


	def print_objects(boxes, class_names):
	print('Objects Found and Confidence Level:\n')
	for i in range(len(boxes)):
	box = boxes[i]
	if len(box) >= 7 and class_names:
	cls_conf = box[5]
	cls_id = box[6]
	print('%i. %s: %f' % (i + 1, class_names[cls_id], cls_conf))


	def plot_boxes(img, boxes, class_names, plot_labels, color = None):

	# Define a tensor used to set the colors of the bounding boxes
	colors = torch.FloatTensor([[1,0,1],[0,0,1],[0,1,1],[0,1,0],[1,1,0],[1,0,0]])

	# Define a function to set the colors of the bounding boxes
	def get_color(c, x, max_val):
	ratio = float(x) / max_val * 5
	i = int(np.floor(ratio))
	j = int(np.ceil(ratio))

	ratio = ratio - i
	r = (1 - ratio) * colors[i][c] + ratio * colors[j][c]

	return int(r * 255)

	# Get the width and height of the image
	width = img.shape[1]
	height = img.shape[0]

	# Create a figure and plot the image
	fig, a = plt.subplots(1,1)
	a.imshow(img)

	# Plot the bounding boxes and corresponding labels on top of the image
	for i in range(len(boxes)):

	# Get the ith bounding box
	box = boxes[i]

	# Get the (x,y) pixel coordinates of the lower-left and lower-right corners
	# of the bounding box relative to the size of the image.
	x1 = int(np.around((box[0] - box[2]/2.0) * width))
	y1 = int(np.around((box[1] - box[3]/2.0) * height))
	x2 = int(np.around((box[0] + box[2]/2.0) * width))
	y2 = int(np.around((box[1] + box[3]/2.0) * height))

	# Set the default rgb value to red
	rgb = (1, 0, 0)

	# Use the same color to plot the bounding boxes of the same object class
	if len(box) >= 7 and class_names:
	cls_conf = box[5]
	cls_id = box[6]
	classes = len(class_names)
	offset = cls_id * 123457 % classes
	red = get_color(2, offset, classes) / 255
	green = get_color(1, offset, classes) / 255
	blue = get_color(0, offset, classes) / 255

	# If a color is given then set rgb to the given color instead
	if color is None:
	rgb = (red, green, blue)
	else:
	rgb = color

	# Calculate the width and height of the bounding box relative to the size of the image.
	width_x = x2 - x1
	width_y = y1 - y2

	# Set the postion and size of the bounding box. (x1, y2) is the pixel coordinate of the
	# lower-left corner of the bounding box relative to the size of the image.
	rect = patches.Rectangle((x1, y2),
	width_x, width_y,
	linewidth = 2,
	edgecolor = rgb,
	facecolor = 'none')

	# Draw the bounding box on top of the image
	a.add_patch(rect)

	# If plot_labels = True then plot the corresponding label
	if plot_labels:

	# Create a string with the object class name and the corresponding object class probability
	conf_tx = class_names[cls_id] + ': {:.1f}'.format(cls_conf)

	# Define x and y offsets for the labels
	lxc = (img.shape[1] * 0.266) / 100
	lyc = (img.shape[0] * 1.180) / 100

	# Draw the labels on top of the image
	a.text(x1 + lxc, y1 - lyc, conf_tx, fontsize = 12, color = 'k',
	bbox = dict(facecolor = rgb, edgecolor = rgb, alpha = 0.6))

	plt.axis("off")
	plt.savefig("output.jpg")
	plt.show()