yolov5s / utils.py

Upload 10 files

8a60c6f 12 months ago

53.1 kB

	import onnxruntime
	import numpy as np
	import onnx
	import copy
	import cv2
	from pathlib import Path
	import matplotlib.pyplot as plt
	import torch
	import time
	import torchvision
	import re
	import glob
	from contextlib import contextmanager
	from torch.utils.data import Dataset
	import yaml
	import os
	from multiprocessing.pool import ThreadPool, Pool
	from tqdm import tqdm
	from itertools import repeat
	import logging
	from PIL import Image, ExifTags
	import hashlib
	import shutil
	import sys
	import pathlib
	CURRENT_DIR = pathlib.Path(__file__).parent
	sys.path.append(str(CURRENT_DIR))
	# Parameters
	IMG_FORMATS = ['bmp', 'jpg', 'jpeg', 'png', 'tif', 'tiff', 'dng', 'webp', 'mpo']
	NUM_THREADS = min(8, os.cpu_count())
	img_formats = IMG_FORMATS # acceptable image suffixes
	vid_formats = ['mov', 'avi', 'mp4', 'mpg', 'mpeg', 'm4v', 'wmv', 'mkv'] # acceptable video suffixes

	# Get orientation exif tag
	for orientation in ExifTags.TAGS.keys():
	if ExifTags.TAGS[orientation] == 'Orientation':
	break


	def make_dirs(dir='./datasets/coco'):
	# Create folders
	dir = Path(dir)
	for p in [dir / 'labels']:
	p.mkdir(parents=True, exist_ok=True) # make dir
	return dir


	def coco91_to_coco80_class(): # converts 80-index (val2014) to 91-index (paper)
	# https://tech.amikelive.com/node-718/what-object-categories-labels-are-in-coco-dataset/
	x = [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, None, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, None, 24, 25, None,
	None, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, None, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50,
	51, 52, 53, 54, 55, 56, 57, 58, 59, None, 60, None, None, 61, None, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72,
	None, 73, 74, 75, 76, 77, 78, 79, None]
	return x


	def is_ascii(s=""):
	# Is string composed of all ASCII (no UTF) characters? (note str().isascii() introduced in python 3.7)
	s = str(s) # convert list, tuple, None, etc. to str
	return len(s.encode().decode("ascii", "ignore")) == len(s)


	def is_chinese(s="人工智能"):
	# Is string composed of any Chinese characters?
	return re.search("[\u4e00-\u9fff]", s)


	def letterbox(
	im,
	new_shape=(640, 640),
	color=(114, 114, 114),
	auto=True,
	scaleFill=False,
	scaleup=True,
	stride=32,
	):
	# Resize and pad image while meeting stride-multiple constraints
	shape = im.shape[:2] # current shape [height, width]
	if isinstance(new_shape, int):
	new_shape = (new_shape, new_shape)

	# Scale ratio (new / old)
	r = min(new_shape[0] / shape[0], new_shape[1] / shape[1])
	if not scaleup: # only scale down, do not scale up (for better val mAP)
	r = min(r, 1.0)

	# Compute padding
	ratio = r, r # width, height ratios
	new_unpad = int(round(shape[1] * r)), int(round(shape[0] * r))
	dw, dh = new_shape[1] - new_unpad[0], new_shape[0] - new_unpad[1] # wh padding
	if auto: # minimum rectangle
	dw, dh = np.mod(dw, stride), np.mod(dh, stride) # wh padding
	elif scaleFill: # stretch
	dw, dh = 0.0, 0.0
	new_unpad = (new_shape[1], new_shape[0])
	ratio = new_shape[1] / shape[1], new_shape[0] / shape[0] # width, height ratios

	dw /= 2 # divide padding into 2 sides
	dh /= 2

	if shape[::-1] != new_unpad: # resize
	im = cv2.resize(im, new_unpad, interpolation=cv2.INTER_LINEAR)
	top, bottom = int(round(dh - 0.1)), int(round(dh + 0.1))
	left, right = int(round(dw - 0.1)), int(round(dw + 0.1))
	im = cv2.copyMakeBorder(
	im, top, bottom, left, right, cv2.BORDER_CONSTANT, value=color
	) # add border
	return im, ratio, (dw, dh)


	def xyxy2xywh(x):
	# Convert nx4 boxes from [x1, y1, x2, y2] to [x, y, w, h] where xy1=top-left, xy2=bottom-right
	y = x.clone() if isinstance(x, torch.Tensor) else np.copy(x)
	y[:, 0] = (x[:, 0] + x[:, 2]) / 2 # x center
	y[:, 1] = (x[:, 1] + x[:, 3]) / 2 # y center
	y[:, 2] = x[:, 2] - x[:, 0] # width
	y[:, 3] = x[:, 3] - x[:, 1] # height
	return y


	def xywh2xyxy(x):
	# Convert nx4 boxes from [x, y, w, h] to [x1, y1, x2, y2] where xy1=top-left, xy2=bottom-right
	y = x.clone() if isinstance(x, torch.Tensor) else np.copy(x)
	y[:, 0] = x[:, 0] - x[:, 2] / 2 # top left x
	y[:, 1] = x[:, 1] - x[:, 3] / 2 # top left y
	y[:, 2] = x[:, 0] + x[:, 2] / 2 # bottom right x
	y[:, 3] = x[:, 1] + x[:, 3] / 2 # bottom right y
	return y


	def non_max_suppression(
	prediction,
	conf_thres=0.25,
	iou_thres=0.45,
	classes=None,
	agnostic=False,
	multi_label=False,
	labels=(),
	max_det=300,
	):
	"""Runs Non-Maximum Suppression (NMS) on inference results

	Returns:
	list of detections, on (n,6) tensor per image [xyxy, conf, cls]
	"""

	nc = prediction.shape[2] - 5 # number of classes
	xc = prediction[..., 4] > conf_thres # candidates

	# Checks
	assert (
	0 <= conf_thres <= 1
	), f"Invalid Confidence threshold {conf_thres}, valid values are between 0.0 and 1.0"
	assert (
	0 <= iou_thres <= 1
	), f"Invalid IoU {iou_thres}, valid values are between 0.0 and 1.0"

	# Settings
	min_wh, max_wh = 2, 4096 # (pixels) minimum and maximum box width and height
	max_nms = 30000 # maximum number of boxes into torchvision.ops.nms()
	time_limit = 10.0 # seconds to quit after
	redundant = True # require redundant detections
	multi_label &= nc > 1 # multiple labels per box (adds 0.5ms/img)
	merge = False # use merge-NMS

	t = time.time()
	output = [torch.zeros((0, 6), device=prediction.device)] * prediction.shape[0]
	for xi, x in enumerate(prediction): # image index, image inference
	# Apply constraints
	# x[((x[..., 2:4] < min_wh) \| (x[..., 2:4] > max_wh)).any(1), 4] = 0 # width-height
	x = x[xc[xi]] # confidence

	# Cat apriori labels if autolabelling
	if labels and len(labels[xi]):
	l = labels[xi]
	v = torch.zeros((len(l), nc + 5), device=x.device)
	v[:, :4] = l[:, 1:5] # box
	v[:, 4] = 1.0 # conf
	v[range(len(l)), l[:, 0].long() + 5] = 1.0 # cls
	x = torch.cat((x, v), 0)

	# If none remain process next image
	if not x.shape[0]:
	continue

	# Compute conf
	x[:, 5:] = x[:, 4:5] # conf = obj_conf cls_conf

	# Box (center x, center y, width, height) to (x1, y1, x2, y2)
	box = xywh2xyxy(x[:, :4])

	# Detections matrix nx6 (xyxy, conf, cls)
	if multi_label:
	i, j = (x[:, 5:] > conf_thres).nonzero(as_tuple=False).T
	x = torch.cat((box[i], x[i, j + 5, None], j[:, None].float()), 1)
	else: # best class only
	conf, j = x[:, 5:].max(1, keepdim=True)
	x = torch.cat((box, conf, j.float()), 1)[conf.view(-1) > conf_thres]

	# Filter by class
	if classes is not None:
	x = x[(x[:, 5:6] == torch.tensor(classes, device=x.device)).any(1)]

	# Apply finite constraint
	# if not torch.isfinite(x).all():
	# x = x[torch.isfinite(x).all(1)]

	# Check shape
	n = x.shape[0] # number of boxes
	if not n: # no boxes
	continue
	elif n > max_nms: # excess boxes
	x = x[x[:, 4].argsort(descending=True)[:max_nms]] # sort by confidence

	# Batched NMS
	c = x[:, 5:6] * (0 if agnostic else max_wh) # classes
	boxes, scores = x[:, :4] + c, x[:, 4] # boxes (offset by class), scores
	i = torchvision.ops.nms(boxes, scores, iou_thres) # NMS
	if i.shape[0] > max_det: # limit detections
	i = i[:max_det]
	if merge and (1 < n < 3e3): # Merge NMS (boxes merged using weighted mean)
	# update boxes as boxes(i,4) = weights(i,n) * boxes(n,4)
	iou = box_iou(boxes[i], boxes) > iou_thres # iou matrix
	weights = iou * scores[None] # box weights
	x[i, :4] = torch.mm(weights, x[:, :4]).float() / weights.sum(
	1, keepdim=True
	) # merged boxes
	if redundant:
	i = i[iou.sum(1) > 1] # require redundancy

	output[xi] = x[i]
	if (time.time() - t) > time_limit:
	print(f"WARNING: NMS time limit {time_limit}s exceeded")
	break # time limit exceeded

	return output


	def clip_coords(boxes, shape):
	# Clip bounding xyxy bounding boxes to image shape (height, width)
	if isinstance(boxes, torch.Tensor): # faster individually
	boxes[:, 0].clamp_(0, shape[1]) # x1
	boxes[:, 1].clamp_(0, shape[0]) # y1
	boxes[:, 2].clamp_(0, shape[1]) # x2
	boxes[:, 3].clamp_(0, shape[0]) # y2
	else: # np.array (faster grouped)
	boxes[:, [0, 2]] = boxes[:, [0, 2]].clip(0, shape[1]) # x1, x2
	boxes[:, [1, 3]] = boxes[:, [1, 3]].clip(0, shape[0]) # y1, y2


	def scale_coords(img1_shape, coords, img0_shape, ratio_pad=None):
	# Rescale coords (xyxy) from img1_shape to img0_shape
	if ratio_pad is None: # calculate from img0_shape
	gain = min(
	img1_shape[0] / img0_shape[0], img1_shape[1] / img0_shape[1]
	) # gain = old / new
	pad = (img1_shape[1] - img0_shape[1] * gain) / 2, (
	img1_shape[0] - img0_shape[0] * gain
	) / 2 # wh padding
	else:
	gain = ratio_pad[0][0]
	pad = ratio_pad[1]

	coords[:, [0, 2]] -= pad[0] # x padding
	coords[:, [1, 3]] -= pad[1] # y padding
	coords[:, :4] /= gain
	clip_coords(coords, img0_shape)
	return coords


	class Annotator:
	# YOLOv5 Annotator for train/val mosaics and jpgs and detect/hub inference annotations
	def __init__(
	self,
	im,
	line_width=None,
	font_size=None,
	font="Arial.ttf",
	pil=False,
	example="abc",
	):
	assert (
	im.data.contiguous
	), "Image not contiguous. Apply np.ascontiguousarray(im) to Annotator() input images."
	self.pil = pil or not is_ascii(example) or is_chinese(example)
	if self.pil: # use PIL
	self.im = im if isinstance(im, Image.Image) else Image.fromarray(im)
	self.draw = ImageDraw.Draw(self.im)
	self.font = check_font(
	font="Arial.Unicode.ttf" if is_chinese(example) else font,
	size=font_size or max(round(sum(self.im.size) / 2 * 0.035), 12),
	)
	else: # use cv2
	self.im = im
	self.lw = line_width or max(round(sum(im.shape) / 2 * 0.003), 2) # line width

	def box_label(
	self, box, label="", color=(128, 128, 128), txt_color=(255, 255, 255)
	):
	# Add one xyxy box to image with label
	if self.pil or not is_ascii(label):
	self.draw.rectangle(box, width=self.lw, outline=color) # box
	if label:
	w, h = self.font.getsize(label) # text width, height
	outside = box[1] - h >= 0 # label fits outside box
	self.draw.rectangle(
	[
	box[0],
	box[1] - h if outside else box[1],
	box[0] + w + 1,
	box[1] + 1 if outside else box[1] + h + 1,
	],
	fill=color,
	)
	# self.draw.text((box[0], box[1]), label, fill=txt_color, font=self.font, anchor='ls') # for PIL>8.0
	self.draw.text(
	(box[0], box[1] - h if outside else box[1]),
	label,
	fill=txt_color,
	font=self.font,
	)
	else: # cv2
	p1, p2 = (int(box[0]), int(box[1])), (int(box[2]), int(box[3]))
	cv2.rectangle(
	self.im, p1, p2, color, thickness=self.lw, lineType=cv2.LINE_AA
	)
	if label:
	tf = max(self.lw - 1, 1) # font thickness
	w, h = cv2.getTextSize(label, 0, fontScale=self.lw / 3, thickness=tf)[
	0
	] # text width, height
	outside = p1[1] - h - 3 >= 0 # label fits outside box
	p2 = p1[0] + w, p1[1] - h - 3 if outside else p1[1] + h + 3
	cv2.rectangle(self.im, p1, p2, color, -1, cv2.LINE_AA) # filled
	cv2.putText(
	self.im,
	label,
	(p1[0], p1[1] - 2 if outside else p1[1] + h + 2),
	0,
	self.lw / 3,
	txt_color,
	thickness=tf,
	lineType=cv2.LINE_AA,
	)

	def rectangle(self, xy, fill=None, outline=None, width=1):
	# Add rectangle to image (PIL-only)
	self.draw.rectangle(xy, fill, outline, width)

	def text(self, xy, text, txt_color=(255, 255, 255)):
	# Add text to image (PIL-only)
	w, h = self.font.getsize(text) # text width, height
	self.draw.text((xy[0], xy[1] - h + 1), text, fill=txt_color, font=self.font)

	def result(self):
	# Return annotated image as array
	return np.asarray(self.im)


	class Colors:
	# Ultralytics color palette https://ultralytics.com/
	def __init__(self):
	# hex = matplotlib.colors.TABLEAU_COLORS.values()
	hex = (
	"FF3838",
	"FF9D97",
	"FF701F",
	"FFB21D",
	"CFD231",
	"48F90A",
	"92CC17",
	"3DDB86",
	"1A9334",
	"00D4BB",
	"2C99A8",
	"00C2FF",
	"344593",
	"6473FF",
	"0018EC",
	"8438FF",
	"520085",
	"CB38FF",
	"FF95C8",
	"FF37C7",
	)
	self.palette = [self.hex2rgb("#" + c) for c in hex]
	self.n = len(self.palette)

	def __call__(self, i, bgr=False):
	c = self.palette[int(i) % self.n]
	return (c[2], c[1], c[0]) if bgr else c

	@staticmethod
	def hex2rgb(h): # rgb order (PIL)
	return tuple(int(h[1 + i : 1 + i + 2], 16) for i in (0, 2, 4))


	@contextmanager
	def torch_distributed_zero_first(local_rank: int):
	"""
	Decorator to make all processes in distributed training wait for each local_master to do something.
	"""
	if local_rank not in [-1, 0]:
	dist.barrier(device_ids=[local_rank])
	yield
	if local_rank == 0:
	dist.barrier(device_ids=[0])


	def create_dataloader(path, imgsz, batch_size, stride, single_cls=False, hyp=None, augment=False, cache=False, pad=0.0,
	rect=False, rank=-1, workers=8, image_weights=False, quad=False, prefix=''):
	# Make sure only the first process in DDP process the dataset first, and the following others can use the cache
	with torch_distributed_zero_first(rank):
	dataset = LoadImagesAndLabels(path, imgsz, batch_size,
	augment=augment, # augment images
	hyp=hyp, # augmentation hyperparameters
	rect=rect, # rectangular training
	cache_images=cache,
	single_cls=single_cls,
	stride=int(stride),
	pad=pad,
	image_weights=image_weights,
	prefix=prefix)

	batch_size = min(batch_size, len(dataset))
	nw = min([os.cpu_count(), batch_size if batch_size > 1 else 0, workers]) # number of workers
	sampler = torch.utils.data.distributed.DistributedSampler(dataset) if rank != -1 else None
	loader = torch.utils.data.DataLoader if image_weights else InfiniteDataLoader
	# Use torch.utils.data.DataLoader() if dataset.properties will update during training else InfiniteDataLoader()
	dataloader = loader(dataset,
	batch_size=batch_size,
	num_workers=nw,
	sampler=sampler,
	pin_memory=True,
	collate_fn=LoadImagesAndLabels.collate_fn4 if quad else LoadImagesAndLabels.collate_fn)
	return dataloader, dataset


	class LoadImagesAndLabels(Dataset):
	# YOLOv5 train_loader/val_loader, loads images and labels for training and validation
	cache_version = 0.5 # dataset labels *.cache version

	def __init__(self, path, img_size=640, batch_size=16, augment=False, hyp=None, rect=False, image_weights=False,
	cache_images=False, single_cls=False, stride=32, pad=0.0, prefix=''):
	self.img_size = img_size
	self.augment = augment
	self.hyp = hyp
	self.image_weights = image_weights
	self.rect = False if image_weights else rect
	self.mosaic = self.augment and not self.rect # load 4 images at a time into a mosaic (only during training)
	self.mosaic_border = [-img_size // 2, -img_size // 2]
	self.stride = stride
	self.path = path
	self.albumentations = Albumentations() if augment else None

	try:
	f = [] # image files
	for p in path if isinstance(path, list) else [path]:
	p = Path(p) # os-agnostic
	if p.is_dir(): # dir
	f += glob.glob(str(p / '*' / '.*'), recursive=True)
	# f = list(p.rglob('*/.*')) # pathlib
	elif p.is_file(): # file
	with open(p, 'r') as t:
	t = t.read().strip().splitlines()
	parent = str(p.parent) + os.sep
	f += [x.replace('./', parent) if x.startswith('./') else x for x in t] # local to global path
	# f += [p.parent / x.lstrip(os.sep) for x in t] # local to global path (pathlib)
	else:
	raise Exception(f'{prefix}{p} does not exist')
	self.img_files = sorted([x.replace('/', os.sep) for x in f if x.split('.')[-1].lower() in IMG_FORMATS])
	# self.img_files = sorted([x for x in f if x.suffix[1:].lower() in img_formats]) # pathlib
	assert self.img_files, f'{prefix}No images found'
	except Exception as e:
	raise Exception(f'{prefix}Error loading data from {path}: {e}\nSee {HELP_URL}')

	# Check cache
	self.label_files = img2label_paths(self.img_files) # labels
	cache_path = (p if p.is_file() else Path(self.label_files[0]).parent).with_suffix('.cache')
	try:
	cache, exists = np.load(cache_path, allow_pickle=True).item(), True # load dict
	assert cache['version'] == self.cache_version # same version
	assert cache['hash'] == get_hash(self.label_files + self.img_files) # same hash
	except:
	cache, exists = self.cache_labels(cache_path, prefix), False # cache

	# Display cache
	nf, nm, ne, nc, n = cache.pop('results') # found, missing, empty, corrupted, total
	if exists:
	d = f"Scanning '{cache_path}' images and labels... {nf} found, {nm} missing, {ne} empty, {nc} corrupted"
	tqdm(None, desc=prefix + d, total=n, initial=n) # display cache results
	if cache['msgs']:
	logging.info('\n'.join(cache['msgs'])) # display warnings
	assert nf > 0 or not augment, f'{prefix}No labels in {cache_path}. Can not train without labels. See {HELP_URL}'

	# Read cache
	[cache.pop(k) for k in ('hash', 'version', 'msgs')] # remove items
	labels, shapes, self.segments = zip(*cache.values())
	self.labels = list(labels)
	self.shapes = np.array(shapes, dtype=np.float64)
	self.img_files = list(cache.keys()) # update
	self.label_files = img2label_paths(cache.keys()) # update
	if single_cls:
	for x in self.labels:
	x[:, 0] = 0

	n = len(shapes) # number of images
	bi = np.floor(np.arange(n) / batch_size).astype(int) # batch index
	nb = bi[-1] + 1 # number of batches
	self.batch = bi # batch index of image
	self.n = n
	self.indices = range(n)

	# Rectangular Training
	if self.rect:
	# Sort by aspect ratio
	s = self.shapes # wh
	ar = s[:, 1] / s[:, 0] # aspect ratio
	irect = ar.argsort()
	self.img_files = [self.img_files[i] for i in irect]
	self.label_files = [self.label_files[i] for i in irect]
	self.labels = [self.labels[i] for i in irect]
	self.shapes = s[irect] # wh
	ar = ar[irect]

	# Set training image shapes
	shapes = [[1, 1]] * nb
	for i in range(nb):
	ari = ar[bi == i]
	mini, maxi = ari.min(), ari.max()
	if maxi < 1:
	shapes[i] = [maxi, 1]
	elif mini > 1:
	shapes[i] = [1, 1 / mini]

	self.batch_shapes = np.ceil(np.array(shapes) * img_size / stride + pad).astype(int) * stride

	# Cache images into memory for faster training (WARNING: large datasets may exceed system RAM)
	self.imgs, self.img_npy = [None] * n, [None] * n
	if cache_images:
	if cache_images == 'disk':
	self.im_cache_dir = Path(Path(self.img_files[0]).parent.as_posix() + '_npy')
	self.img_npy = [self.im_cache_dir / Path(f).with_suffix('.npy').name for f in self.img_files]
	self.im_cache_dir.mkdir(parents=True, exist_ok=True)
	gb = 0 # Gigabytes of cached images
	self.img_hw0, self.img_hw = [None] * n, [None] * n
	results = ThreadPool(NUM_THREADS).imap(lambda x: load_image(*x), zip(repeat(self), range(n)))
	pbar = tqdm(enumerate(results), total=n)
	for i, x in pbar:
	if cache_images == 'disk':
	if not self.img_npy[i].exists():
	np.save(self.img_npy[i].as_posix(), x[0])
	gb += self.img_npy[i].stat().st_size
	else:
	self.imgs[i], self.img_hw0[i], self.img_hw[i] = x # im, hw_orig, hw_resized = load_image(self, i)
	gb += self.imgs[i].nbytes
	pbar.desc = f'{prefix}Caching images ({gb / 1E9:.1f}GB {cache_images})'
	pbar.close()

	def cache_labels(self, path=Path('./labels.cache'), prefix=''):
	# Cache dataset labels, check images and read shapes
	x = {} # dict
	nm, nf, ne, nc, msgs = 0, 0, 0, 0, [] # number missing, found, empty, corrupt, messages
	desc = f"{prefix}Scanning '{path.parent / path.stem}' images and labels..."
	with Pool(NUM_THREADS) as pool:
	pbar = tqdm(pool.imap(verify_image_label, zip(self.img_files, self.label_files, repeat(prefix))), desc=desc, total=len(self.img_files))
	for im_file, l, shape, segments, nm_f, nf_f, ne_f, nc_f, msg in pbar:
	nm += nm_f
	nf += nf_f
	ne += ne_f
	nc += nc_f
	if im_file:
	x[im_file] = [l, shape, segments]
	if msg:
	msgs.append(msg)
	pbar.desc = f"{desc}{nf} found, {nm} missing, {ne} empty, {nc} corrupted"

	pbar.close()
	if msgs:
	logging.info('\n'.join(msgs))
	if nf == 0:
	logging.info(f'{prefix}WARNING: No labels found in {path}. See {HELP_URL}')
	x['hash'] = get_hash(self.label_files + self.img_files)
	x['results'] = nf, nm, ne, nc, len(self.img_files)
	x['msgs'] = msgs # warnings
	x['version'] = self.cache_version # cache version
	try:
	np.save(path, x) # save cache for next time
	path.with_suffix('.cache.npy').rename(path) # remove .npy suffix
	logging.info(f'{prefix}New cache created: {path}')
	except Exception as e:
	logging.info(f'{prefix}WARNING: Cache directory {path.parent} is not writeable: {e}') # path not writeable
	return x

	def __len__(self):
	return len(self.img_files)

	# def __iter__(self):
	# self.count = -1
	# print('ran dataset iter')
	# #self.shuffled_vector = np.random.permutation(self.nF) if self.augment else np.arange(self.nF)
	# return self

	def __getitem__(self, index):
	index = self.indices[index] # linear, shuffled, or image_weights

	hyp = self.hyp
	mosaic = self.mosaic and random.random() < hyp['mosaic']
	if mosaic:
	# Load mosaic
	img, labels = load_mosaic(self, index)
	shapes = None

	# MixUp augmentation
	if random.random() < hyp['mixup']:
	img, labels = mixup(img, labels, *load_mosaic(self, random.randint(0, self.n - 1)))

	else:
	# Load image
	img, (h0, w0), (h, w) = load_image(self, index)

	# Letterbox
	shape = self.batch_shapes[self.batch[index]] if self.rect else self.img_size # final letterboxed shape
	img, ratio, pad = letterbox(img, shape, auto=False, scaleup=self.augment)
	shapes = (h0, w0), ((h / h0, w / w0), pad) # for COCO mAP rescaling

	labels = self.labels[index].copy()
	if labels.size: # normalized xywh to pixel xyxy format
	labels[:, 1:] = xywhn2xyxy(labels[:, 1:], ratio[0] * w, ratio[1] * h, padw=pad[0], padh=pad[1])

	if self.augment:
	img, labels = random_perspective(img, labels,
	degrees=hyp['degrees'],
	translate=hyp['translate'],
	scale=hyp['scale'],
	shear=hyp['shear'],
	perspective=hyp['perspective'])

	nl = len(labels) # number of labels
	if nl:
	labels[:, 1:5] = xyxy2xywhn(labels[:, 1:5], w=img.shape[1], h=img.shape[0], clip=True, eps=1E-3)

	if self.augment:
	# Albumentations
	img, labels = self.albumentations(img, labels)
	nl = len(labels) # update after albumentations

	# HSV color-space
	augment_hsv(img, hgain=hyp['hsv_h'], sgain=hyp['hsv_s'], vgain=hyp['hsv_v'])

	# Flip up-down
	if random.random() < hyp['flipud']:
	img = np.flipud(img)
	if nl:
	labels[:, 2] = 1 - labels[:, 2]

	# Flip left-right
	if random.random() < hyp['fliplr']:
	img = np.fliplr(img)
	if nl:
	labels[:, 1] = 1 - labels[:, 1]

	# Cutouts
	# labels = cutout(img, labels, p=0.5)

	labels_out = torch.zeros((nl, 6))
	if nl:
	labels_out[:, 1:] = torch.from_numpy(labels)

	# Convert
	img = img.transpose((2, 0, 1))[::-1] # HWC to CHW, BGR to RGB
	img = np.ascontiguousarray(img)

	return torch.from_numpy(img), labels_out, self.img_files[index], shapes

	@staticmethod
	def collate_fn(batch):
	img, label, path, shapes = zip(*batch) # transposed
	for i, l in enumerate(label):
	l[:, 0] = i # add target image index for build_targets()
	return torch.stack(img, 0), torch.cat(label, 0), path, shapes

	@staticmethod
	def collate_fn4(batch):
	img, label, path, shapes = zip(*batch) # transposed
	n = len(shapes) // 4
	img4, label4, path4, shapes4 = [], [], path[:n], shapes[:n]

	ho = torch.tensor([[0., 0, 0, 1, 0, 0]])
	wo = torch.tensor([[0., 0, 1, 0, 0, 0]])
	s = torch.tensor([[1, 1, .5, .5, .5, .5]]) # scale
	for i in range(n): # zidane torch.zeros(16,3,720,1280) # BCHW
	i *= 4
	if random.random() < 0.5:
	im = F.interpolate(img[i].unsqueeze(0).float(), scale_factor=2., mode='bilinear', align_corners=False)[
	0].type(img[i].type())
	l = label[i]
	else:
	im = torch.cat((torch.cat((img[i], img[i + 1]), 1), torch.cat((img[i + 2], img[i + 3]), 1)), 2)
	l = torch.cat((label[i], label[i + 1] + ho, label[i + 2] + wo, label[i + 3] + ho + wo), 0) * s
	img4.append(im)
	label4.append(l)

	for i, l in enumerate(label4):
	l[:, 0] = i # add target image index for build_targets()

	return torch.stack(img4, 0), torch.cat(label4, 0), path4, shapes4


	def coco80_to_coco91_class(): # converts 80-index (val2014) to 91-index (paper)
	# https://tech.amikelive.com/node-718/what-object-categories-labels-are-in-coco-dataset/
	# a = np.loadtxt('data/coco.names', dtype='str', delimiter='\n')
	# b = np.loadtxt('data/coco_paper.names', dtype='str', delimiter='\n')
	# x1 = [list(a[i] == b).index(True) + 1 for i in range(80)] # darknet to coco
	# x2 = [list(b[i] == a).index(True) if any(b[i] == a) else None for i in range(91)] # coco to darknet
	x = [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 28, 31, 32, 33, 34,
	35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63,
	64, 65, 67, 70, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 84, 85, 86, 87, 88, 89, 90]
	return x


	def check_dataset(data, autodownload=True):
	# Download and/or unzip dataset if not found locally
	# Usage: https://github.com/ultralytics/yolov5/releases/download/v1.0/coco128_with_yaml.zip

	# Download (optional)
	extract_dir = ''
	if isinstance(data, (str, Path)) and str(data).endswith('.zip'): # i.e. gs://bucket/dir/coco128.zip
	download(data, dir='../datasets', unzip=True, delete=False, curl=False, threads=1)
	data = next((Path('../datasets') / Path(data).stem).rglob('*.yaml'))
	extract_dir, autodownload = data.parent, False

	# Read yaml (optional)
	if isinstance(data, (str, Path)):
	with open(data, errors='ignore') as f:
	data = yaml.safe_load(f) # dictionary

	# Parse yaml
	path = extract_dir or Path(data.get('path') or '') # optional 'path' default to '.'
	for k in 'train', 'val', 'test':
	if data.get(k): # prepend path
	data[k] = str(path / data[k]) if isinstance(data[k], str) else [str(path / x) for x in data[k]]

	assert 'nc' in data, "Dataset 'nc' key missing."
	if 'names' not in data:
	data['names'] = [f'class{i}' for i in range(data['nc'])] # assign class names if missing
	train, val, test, s = [data.get(x) for x in ('train', 'val', 'test', 'download')]
	if val:
	val = [Path(x).resolve() for x in (val if isinstance(val, list) else [val])] # val path
	if not all(x.exists() for x in val):
	print('\nWARNING: Dataset not found, nonexistent paths: %s' % [str(x) for x in val if not x.exists()])
	if s and autodownload: # download script
	root = path.parent if 'path' in data else '..' # unzip directory i.e. '../'
	if s.startswith('http') and s.endswith('.zip'): # URL
	f = Path(s).name # filename
	print(f'Downloading {s} to {f}...')
	torch.hub.download_url_to_file(s, f)
	Path(root).mkdir(parents=True, exist_ok=True) # create root
	ZipFile(f).extractall(path=root) # unzip
	Path(f).unlink() # remove zip
	r = None # success
	elif s.startswith('bash '): # bash script
	print(f'Running {s} ...')
	r = os.system(s)
	else: # python script
	r = exec(s, {'yaml': data}) # return None
	print(f"Dataset autodownload {f'success, saved to {root}' if r in (0, None) else 'failure'}\n")
	else:
	raise Exception('Dataset not found.')

	return data # dictionary


	def box_iou(box1, box2):
	# https://github.com/pytorch/vision/blob/master/torchvision/ops/boxes.py
	"""
	Return intersection-over-union (Jaccard index) of boxes.
	Both sets of boxes are expected to be in (x1, y1, x2, y2) format.
	Arguments:
	box1 (Tensor[N, 4])
	box2 (Tensor[M, 4])
	Returns:
	iou (Tensor[N, M]): the NxM matrix containing the pairwise
	IoU values for every element in boxes1 and boxes2
	"""

	def box_area(box):
	# box = 4xn
	return (box[2] - box[0]) * (box[3] - box[1])

	area1 = box_area(box1.T)
	area2 = box_area(box2.T)

	# inter(N,M) = (rb(N,M,2) - lt(N,M,2)).clamp(0).prod(2)
	inter = (torch.min(box1[:, None, 2:], box2[:, 2:]) - torch.max(box1[:, None, :2], box2[:, :2])).clamp(0).prod(2)
	return inter / (area1[:, None] + area2 - inter) # iou = inter / (area1 + area2 - inter)


	def increment_path(path, exist_ok=False, sep='', mkdir=False):
	# Increment file or directory path, i.e. runs/exp --> runs/exp{sep}2, runs/exp{sep}3, ... etc.
	path = Path(path) # os-agnostic
	if path.exists() and not exist_ok:
	suffix = path.suffix
	path = path.with_suffix('')
	dirs = glob.glob(f"{path}{sep}*") # similar paths
	matches = [re.search(rf"%s{sep}(\d+)" % path.stem, d) for d in dirs]
	i = [int(m.groups()[0]) for m in matches if m] # indices
	n = max(i) + 1 if i else 2 # increment number
	path = Path(f"{path}{sep}{n}{suffix}") # update path
	dir = path if path.suffix == '' else path.parent # directory
	if not dir.exists() and mkdir:
	dir.mkdir(parents=True, exist_ok=True) # make directory
	return path


	def colorstr(*input):
	# Colors a string https://en.wikipedia.org/wiki/ANSI_escape_code, i.e. colorstr('blue', 'hello world')
	*args, string = input if len(input) > 1 else ('blue', 'bold', input[0]) # color arguments, string
	colors = {'black': '\033[30m', # basic colors
	'red': '\033[31m',
	'green': '\033[32m',
	'yellow': '\033[33m',
	'blue': '\033[34m',
	'magenta': '\033[35m',
	'cyan': '\033[36m',
	'white': '\033[37m',
	'bright_black': '\033[90m', # bright colors
	'bright_red': '\033[91m',
	'bright_green': '\033[92m',
	'bright_yellow': '\033[93m',
	'bright_blue': '\033[94m',
	'bright_magenta': '\033[95m',
	'bright_cyan': '\033[96m',
	'bright_white': '\033[97m',
	'end': '\033[0m', # misc
	'bold': '\033[1m',
	'underline': '\033[4m'}
	return ''.join(colors[x] for x in args) + f'{string}' + colors['end']


	def ap_per_class(tp, conf, pred_cls, target_cls, plot=False, save_dir='.', names=()):
	""" Compute the average precision, given the recall and precision curves.
	Source: https://github.com/rafaelpadilla/Object-Detection-Metrics.
	# Arguments
	tp: True positives (nparray, nx1 or nx10).
	conf: Objectness value from 0-1 (nparray).
	pred_cls: Predicted object classes (nparray).
	target_cls: True object classes (nparray).
	plot: Plot precision-recall curve at mAP@0.5
	save_dir: Plot save directory
	# Returns
	The average precision as computed in py-faster-rcnn.
	"""

	# Sort by objectness
	i = np.argsort(-conf)
	tp, conf, pred_cls = tp[i], conf[i], pred_cls[i]

	# Find unique classes
	unique_classes = np.unique(target_cls)
	nc = unique_classes.shape[0] # number of classes, number of detections

	# Create Precision-Recall curve and compute AP for each class
	px, py = np.linspace(0, 1, 1000), [] # for plotting
	ap, p, r = np.zeros((nc, tp.shape[1])), np.zeros((nc, 1000)), np.zeros((nc, 1000))
	for ci, c in enumerate(unique_classes):
	i = pred_cls == c
	n_l = (target_cls == c).sum() # number of labels
	n_p = i.sum() # number of predictions

	if n_p == 0 or n_l == 0:
	continue
	else:
	# Accumulate FPs and TPs
	fpc = (1 - tp[i]).cumsum(0)
	tpc = tp[i].cumsum(0)

	# Recall
	recall = tpc / (n_l + 1e-16) # recall curve
	r[ci] = np.interp(-px, -conf[i], recall[:, 0], left=0) # negative x, xp because xp decreases

	# Precision
	precision = tpc / (tpc + fpc) # precision curve
	p[ci] = np.interp(-px, -conf[i], precision[:, 0], left=1) # p at pr_score

	# AP from recall-precision curve
	for j in range(tp.shape[1]):
	ap[ci, j], mpre, mrec = compute_ap(recall[:, j], precision[:, j])
	if plot and j == 0:
	py.append(np.interp(px, mrec, mpre)) # precision at mAP@0.5

	# Compute F1 (harmonic mean of precision and recall)
	f1 = 2 * p * r / (p + r + 1e-16)
	if plot:
	plot_pr_curve(px, py, ap, Path(save_dir) / 'PR_curve.png', names)
	plot_mc_curve(px, f1, Path(save_dir) / 'F1_curve.png', names, ylabel='F1')
	plot_mc_curve(px, p, Path(save_dir) / 'P_curve.png', names, ylabel='Precision')
	plot_mc_curve(px, r, Path(save_dir) / 'R_curve.png', names, ylabel='Recall')

	i = f1.mean(0).argmax() # max F1 index
	return p[:, i], r[:, i], ap, f1[:, i], unique_classes.astype('int32')


	def compute_ap(recall, precision):
	""" Compute the average precision, given the recall and precision curves
	# Arguments
	recall: The recall curve (list)
	precision: The precision curve (list)
	# Returns
	Average precision, precision curve, recall curve
	"""

	# Append sentinel values to beginning and end
	mrec = np.concatenate(([0.0], recall, [1.0]))
	mpre = np.concatenate(([1.0], precision, [0.0]))

	# Compute the precision envelope
	mpre = np.flip(np.maximum.accumulate(np.flip(mpre)))

	# Integrate area under curve
	method = 'interp' # methods: 'continuous', 'interp'
	if method == 'interp':
	x = np.linspace(0, 1, 101) # 101-point interp (COCO)
	ap = np.trapz(np.interp(x, mrec, mpre), x) # integrate
	else: # 'continuous'
	i = np.where(mrec[1:] != mrec[:-1])[0] # points where x axis (recall) changes
	ap = np.sum((mrec[i + 1] - mrec[i]) * mpre[i + 1]) # area under curve

	return ap, mpre, mrec


	class ConfusionMatrix:
	# Updated version of https://github.com/kaanakan/object_detection_confusion_matrix
	def __init__(self, nc, conf=0.25, iou_thres=0.45):
	self.matrix = np.zeros((nc + 1, nc + 1))
	self.nc = nc # number of classes
	self.conf = conf
	self.iou_thres = iou_thres

	def process_batch(self, detections, labels):
	"""
	Return intersection-over-union (Jaccard index) of boxes.
	Both sets of boxes are expected to be in (x1, y1, x2, y2) format.
	Arguments:
	detections (Array[N, 6]), x1, y1, x2, y2, conf, class
	labels (Array[M, 5]), class, x1, y1, x2, y2
	Returns:
	None, updates confusion matrix accordingly
	"""
	detections = detections[detections[:, 4] > self.conf]
	gt_classes = labels[:, 0].int()
	detection_classes = detections[:, 5].int()
	iou = box_iou(labels[:, 1:], detections[:, :4])

	x = torch.where(iou > self.iou_thres)
	if x[0].shape[0]:
	matches = torch.cat((torch.stack(x, 1), iou[x[0], x[1]][:, None]), 1).cpu().numpy()
	if x[0].shape[0] > 1:
	matches = matches[matches[:, 2].argsort()[::-1]]
	matches = matches[np.unique(matches[:, 1], return_index=True)[1]]
	matches = matches[matches[:, 2].argsort()[::-1]]
	matches = matches[np.unique(matches[:, 0], return_index=True)[1]]
	else:
	matches = np.zeros((0, 3))

	n = matches.shape[0] > 0
	m0, m1, _ = matches.transpose().astype(np.int16)
	for i, gc in enumerate(gt_classes):
	j = m0 == i
	if n and sum(j) == 1:
	self.matrix[detection_classes[m1[j]], gc] += 1 # correct
	else:
	self.matrix[self.nc, gc] += 1 # background FP

	if n:
	for i, dc in enumerate(detection_classes):
	if not any(m1 == i):
	self.matrix[dc, self.nc] += 1 # background FN

	def matrix(self):
	return self.matrix

	def plot(self, normalize=True, save_dir='', names=()):
	try:
	import seaborn as sn

	array = self.matrix / ((self.matrix.sum(0).reshape(1, -1) + 1E-6) if normalize else 1) # normalize columns
	array[array < 0.005] = np.nan # don't annotate (would appear as 0.00)

	fig = plt.figure(figsize=(12, 9), tight_layout=True)
	sn.set(font_scale=1.0 if self.nc < 50 else 0.8) # for label size
	labels = (0 < len(names) < 99) and len(names) == self.nc # apply names to ticklabels
	with warnings.catch_warnings():
	warnings.simplefilter('ignore') # suppress empty matrix RuntimeWarning: All-NaN slice encountered
	sn.heatmap(array, annot=self.nc < 30, annot_kws={"size": 8}, cmap='Blues', fmt='.2f', square=True,
	xticklabels=names + ['background FP'] if labels else "auto",
	yticklabels=names + ['background FN'] if labels else "auto").set_facecolor((1, 1, 1))
	fig.axes[0].set_xlabel('True')
	fig.axes[0].set_ylabel('Predicted')
	fig.savefig(Path(save_dir) / 'confusion_matrix.png', dpi=250)
	plt.close()
	except Exception as e:
	print(f'WARNING: ConfusionMatrix plot failure: {e}')

	def print(self):
	for i in range(self.nc + 1):
	print(' '.join(map(str, self.matrix[i])))


	def output_to_target(output):
	# Convert model output to target format [batch_id, class_id, x, y, w, h, conf]
	targets = []
	for i, o in enumerate(output):
	for *box, conf, cls in o.cpu().numpy():
	targets.append([i, cls, list(xyxy2xywh(np.array(box)[None])), conf])
	return np.array(targets)


	def plot_val_study(file='', dir='', x=None): # from utils.plots import *; plot_val_study()
	# Plot file=study.txt generated by val.py (or plot all study*.txt in dir)
	save_dir = Path(file).parent if file else Path(dir)
	plot2 = False # plot additional results
	if plot2:
	ax = plt.subplots(2, 4, figsize=(10, 6), tight_layout=True)[1].ravel()

	fig2, ax2 = plt.subplots(1, 1, figsize=(8, 4), tight_layout=True)
	# for f in [save_dir / f'study_coco_{x}.txt' for x in ['yolov5n6', 'yolov5s6', 'yolov5m6', 'yolov5l6', 'yolov5x6']]:
	for f in sorted(save_dir.glob('study*.txt')):
	y = np.loadtxt(f, dtype=np.float32, usecols=[0, 1, 2, 3, 7, 8, 9], ndmin=2).T
	x = np.arange(y.shape[1]) if x is None else np.array(x)
	if plot2:
	s = ['P', 'R', 'mAP@.5', 'mAP@.5:.95', 't_preprocess (ms/img)', 't_inference (ms/img)', 't_NMS (ms/img)']
	for i in range(7):
	ax[i].plot(x, y[i], '.-', linewidth=2, markersize=8)
	ax[i].set_title(s[i])

	j = y[3].argmax() + 1
	ax2.plot(y[5, 1:j], y[3, 1:j] * 1E2, '.-', linewidth=2, markersize=8,
	label=f.stem.replace('study_coco_', '').replace('yolo', 'YOLO'))

	ax2.plot(1E3 / np.array([209, 140, 97, 58, 35, 18]), [34.6, 40.5, 43.0, 47.5, 49.7, 51.5],
	'k.-', linewidth=2, markersize=8, alpha=.25, label='EfficientDet')

	ax2.grid(alpha=0.2)
	ax2.set_yticks(np.arange(20, 60, 5))
	ax2.set_xlim(0, 57)
	ax2.set_ylim(25, 55)
	ax2.set_xlabel('GPU Speed (ms/img)')
	ax2.set_ylabel('COCO AP val')
	ax2.legend(loc='lower right')
	f = save_dir / 'study.png'
	print(f'Saving {f}...')
	plt.savefig(f, dpi=300)


	def check_yaml(file, suffix=('.yaml', '.yml')):
	# Search/download YAML file (if necessary) and return path, checking suffix
	return check_file(file, suffix)


	def check_file(file, suffix=''):
	# Search/download file (if necessary) and return path
	check_suffix(file, suffix) # optional
	file = str(file) # convert to str()
	if Path(file).is_file() or file == '': # exists
	return file
	elif file.startswith(('http:/', 'https:/')): # download
	url = str(Path(file)).replace(':/', '://') # Pathlib turns :// -> :/
	file = Path(urllib.parse.unquote(file).split('?')[0]).name # '%2F' to '/', split https://url.com/file.txt?auth
	print(f'Downloading {url} to {file}...')
	torch.hub.download_url_to_file(url, file)
	assert Path(file).exists() and Path(file).stat().st_size > 0, f'File download failed: {url}' # check
	return file
	else: # search
	files = []
	for d in 'data', 'models', 'utils': # search directories
	files.extend(glob.glob(str(ROOT / d / '**' / file), recursive=True)) # find file
	assert len(files), f'File not found: {file}' # assert file was found
	assert len(files) == 1, f"Multiple files match '{file}', specify exact path: {files}" # assert unique
	return files[0] # return file


	def check_suffix(file='yolov5s.pt', suffix=('.pt',), msg=''):
	# Check file(s) for acceptable suffixes
	if file and suffix:
	if isinstance(suffix, str):
	suffix = [suffix]
	for f in file if isinstance(file, (list, tuple)) else [file]:
	assert Path(f).suffix.lower() in suffix, f"{msg}{f} acceptable suffix is {suffix}"


	def img2label_paths(img_paths):
	# Define label paths as a function of image paths
	sa, sb = os.sep + 'images' + os.sep, os.sep + 'labels' + os.sep # /images/, /labels/ substrings
	return [sb.join(x.rsplit(sa, 1)).rsplit('.', 1)[0] + '.txt' for x in img_paths]


	def exif_size(img):
	# Returns exif-corrected PIL size
	s = img.size # (width, height)
	try:
	rotation = dict(img._getexif().items())[orientation]
	if rotation == 6: # rotation 270
	s = (s[1], s[0])
	elif rotation == 8: # rotation 90
	s = (s[1], s[0])
	except:
	pass

	return s


	def verify_image_label(args):
	# Verify one image-label pair
	im_file, lb_file, prefix = args
	nm, nf, ne, nc, msg, segments = 0, 0, 0, 0, '', [] # number (missing, found, empty, corrupt), message, segments
	try:
	# verify images
	im = Image.open(im_file)
	im.verify() # PIL verify
	shape = exif_size(im) # image size
	assert (shape[0] > 9) & (shape[1] > 9), f'image size {shape} <10 pixels'
	assert im.format.lower() in IMG_FORMATS, f'invalid image format {im.format}'
	if im.format.lower() in ('jpg', 'jpeg'):
	with open(im_file, 'rb') as f:
	f.seek(-2, 2)
	if f.read() != b'\xff\xd9': # corrupt JPEG
	Image.open(im_file).save(im_file, format='JPEG', subsampling=0, quality=100) # re-save image
	msg = f'{prefix}WARNING: corrupt JPEG restored and saved {im_file}'

	# verify labels
	if os.path.isfile(lb_file):
	nf = 1 # label found
	with open(lb_file, 'r') as f:
	l = [x.split() for x in f.read().strip().splitlines() if len(x)]
	if any([len(x) > 8 for x in l]): # is segment
	classes = np.array([x[0] for x in l], dtype=np.float32)
	segments = [np.array(x[1:], dtype=np.float32).reshape(-1, 2) for x in l] # (cls, xy1...)
	l = np.concatenate((classes.reshape(-1, 1), segments2boxes(segments)), 1) # (cls, xywh)
	l = np.array(l, dtype=np.float32)
	if len(l):
	assert l.shape[1] == 5, 'labels require 5 columns each'
	assert (l >= 0).all(), 'negative labels'
	assert (l[:, 1:] <= 1).all(), 'non-normalized or out of bounds coordinate labels'
	assert np.unique(l, axis=0).shape[0] == l.shape[0], 'duplicate labels'
	else:
	ne = 1 # label empty
	l = np.zeros((0, 5), dtype=np.float32)
	else:
	nm = 1 # label missing
	l = np.zeros((0, 5), dtype=np.float32)
	return im_file, l, shape, segments, nm, nf, ne, nc, msg
	except Exception as e:
	nc = 1
	msg = f'{prefix}WARNING: Ignoring corrupted image and/or label {im_file}: {e}'
	return [None, None, None, None, nm, nf, ne, nc, msg]


	def segments2boxes(segments):
	# Convert segment labels to box labels, i.e. (cls, xy1, xy2, ...) to (cls, xywh)
	boxes = []
	for s in segments:
	x, y = s.T # segment xy
	boxes.append([x.min(), y.min(), x.max(), y.max()]) # cls, xyxy
	return xyxy2xywh(np.array(boxes)) # cls, xywh


	def get_hash(paths):
	# Returns a single hash value of a list of paths (files or dirs)
	size = sum(os.path.getsize(p) for p in paths if os.path.exists(p)) # sizes
	h = hashlib.md5(str(size).encode()) # hash sizes
	h.update(''.join(paths).encode()) # hash paths
	return h.hexdigest() # return hash


	class InfiniteDataLoader(torch.utils.data.dataloader.DataLoader):
	""" Dataloader that reuses workers

	Uses same syntax as vanilla DataLoader
	"""

	def __init__(self, args, *kwargs):
	super().__init__(args, *kwargs)
	object.__setattr__(self, 'batch_sampler', _RepeatSampler(self.batch_sampler))
	self.iterator = super().__iter__()

	def __len__(self):
	return len(self.batch_sampler.sampler)

	def __iter__(self):
	for i in range(len(self)):
	yield next(self.iterator)


	class _RepeatSampler(object):
	""" Sampler that repeats forever

	Args:
	sampler (Sampler)
	"""

	def __init__(self, sampler):
	self.sampler = sampler

	def __iter__(self):
	while True:
	yield from iter(self.sampler)


	def load_image(self, i):
	# loads 1 image from dataset index 'i', returns im, original hw, resized hw
	im = self.imgs[i]
	if im is None: # not cached in ram
	npy = self.img_npy[i]
	if npy and npy.exists(): # load npy
	im = np.load(npy)
	else: # read image
	path = self.img_files[i]
	im = cv2.imread(path) # BGR
	assert im is not None, 'Image Not Found ' + path
	h0, w0 = im.shape[:2] # orig hw
	r = self.img_size / max(h0, w0) # ratio
	if r != 1: # if sizes are not equal
	im = cv2.resize(im, (int(w0 * r), int(h0 * r)),
	interpolation=cv2.INTER_AREA if r < 1 and not self.augment else cv2.INTER_LINEAR)
	return im, (h0, w0), im.shape[:2] # im, hw_original, hw_resized
	else:
	return self.imgs[i], self.img_hw0[i], self.img_hw[i] # im, hw_original, hw_resized


	def xywhn2xyxy(x, w=640, h=640, padw=0, padh=0):
	# Convert nx4 boxes from [x, y, w, h] normalized to [x1, y1, x2, y2] where xy1=top-left, xy2=bottom-right
	y = x.clone() if isinstance(x, torch.Tensor) else np.copy(x)
	y[:, 0] = w * (x[:, 0] - x[:, 2] / 2) + padw # top left x
	y[:, 1] = h * (x[:, 1] - x[:, 3] / 2) + padh # top left y
	y[:, 2] = w * (x[:, 0] + x[:, 2] / 2) + padw # bottom right x
	y[:, 3] = h * (x[:, 1] + x[:, 3] / 2) + padh # bottom right y
	return y


	def xyxy2xywhn(x, w=640, h=640, clip=False, eps=0.0):
	# Convert nx4 boxes from [x1, y1, x2, y2] to [x, y, w, h] normalized where xy1=top-left, xy2=bottom-right
	if clip:
	clip_coords(x, (h - eps, w - eps)) # warning: inplace clip
	y = x.clone() if isinstance(x, torch.Tensor) else np.copy(x)
	y[:, 0] = ((x[:, 0] + x[:, 2]) / 2) / w # x center
	y[:, 1] = ((x[:, 1] + x[:, 3]) / 2) / h # y center
	y[:, 2] = (x[:, 2] - x[:, 0]) / w # width
	y[:, 3] = (x[:, 3] - x[:, 1]) / h # height
	return y


	def post_process(x):
	grid = np.load("./grid.npy", allow_pickle=True)
	anchor_grid = np.load("./anchor_grid.npy", allow_pickle=True)
	x = list(x)
	z = [] # inference output
	stride = [8, 16, 32]
	for i in range(3):
	bs, _, ny, nx = x[i].shape # x(bs,255,20,20) to x(bs,3,20,20,85)
	x[i] = (
	torch.tensor(x[i])
	.view(bs, 3, 85, ny, nx)
	.permute(0, 1, 3, 4, 2)
	.contiguous()
	)
	y = x[i].sigmoid()
	xy = (y[..., 0:2] * 2.0 - 0.5 + grid[i]) * stride[i]
	wh = (y[..., 2:4] * 2) ** 2 * anchor_grid[i]
	y = torch.cat((xy, wh, y[..., 4:]), -1)
	z.append(y.view(bs, -1, 85))

	return (torch.cat(z, 1), x)