Upload 4 files

5604fdf verified 3 months ago

13.7 kB

	# General utils

	import glob
	import os
	import random
	import time

	import cv2
	import numpy as np
	import torch
	import torchvision
	from PIL import Image

	# Settings: module-level configuration applied once at import time.
	torch.set_printoptions(linewidth=320, precision=5, profile='long')
	np.set_printoptions(linewidth=320, formatter={'float_kind': '{:11.5g}'.format})  # format short g, %precision=5
	cv2.setNumThreads(0)  # prevent OpenCV from multithreading (incompatible with PyTorch DataLoader)
	# os.cpu_count() returns None when the CPU count cannot be determined; fall back to 1
	# so that min() never compares None with an int (which would raise TypeError on import).
	os.environ['NUMEXPR_MAX_THREADS'] = str(min(os.cpu_count() or 1, 8))  # NumExpr max threads

	def init_seeds(seed=0):
	    """Seed the Python, NumPy and PyTorch random number generators.

	    Args:
	        seed (int): Seed value applied to every generator.
	    """
	    random.seed(seed)
	    np.random.seed(seed)
	    # ``init_torch_seeds`` is not defined or imported in the visible part of this
	    # module, so calling it unconditionally raises NameError. Use it when some
	    # other part of the module provides it, otherwise seed torch directly.
	    torch_seeder = globals().get('init_torch_seeds')
	    if callable(torch_seeder):
	        torch_seeder(seed)
	    else:
	        torch.manual_seed(seed)


	def get_latest_run(search_dir='.'):
	    """Return the path to the newest ``last.pt`` found anywhere below ``search_dir``.

	    Args:
	        search_dir (str): Directory whose subtree is searched (i.e. to --resume from).

	    Returns:
	        str: Path of the ``last.pt`` with the largest ``os.path.getctime`` value,
	            or an empty string when no such file exists.
	    """
	    # ``recursive=True`` only has an effect when the pattern contains ``**``; with a
	    # single ``*`` only direct sub-directories were searched and checkpoints stored
	    # deeper (e.g. <run>/weights/last.pt) were never found.
	    candidates = glob.glob(f'{search_dir}/**/last.pt', recursive=True)
	    return max(candidates, key=os.path.getctime) if candidates else ''


	def imwrite(img, file_path, params=None, auto_mkdir=True):
	    """Save an image to disk through OpenCV.

	    Args:
	        img (ndarray): Image array to be written.
	        file_path (str): Destination path of the image file.
	        params (None or list): Forwarded unchanged as the third argument of
	            :func:`cv2.imwrite`.
	        auto_mkdir (bool): When True, the parent folder of `file_path` is
	            created first if it does not exist yet.

	    Returns:
	        bool: The value returned by :func:`cv2.imwrite` (successful or not).
	    """
	    if auto_mkdir:
	        parent = os.path.dirname(file_path)
	        # abspath turns an empty parent ('' for a bare file name) into the cwd.
	        os.makedirs(os.path.abspath(parent), exist_ok=True)
	    return cv2.imwrite(file_path, img, params)


	def img2tensor(imgs, bgr2rgb=True, float32=True):
	    """Convert one numpy image, or a list of them, to torch tensors.

	    Every image is indexed as (h, w, c) and returned with its axes
	    reordered to (c, h, w).

	    Args:
	        imgs (list[ndarray] | ndarray): Input image(s).
	        bgr2rgb (bool): Swap BGR to RGB for images that have 3 channels.
	        float32 (bool): Convert the resulting tensor to float32.

	    Returns:
	        list[tensor] | tensor: A list of tensors for list input, otherwise a
	            single tensor.
	    """

	    def _convert(array):
	        needs_swap = array.shape[2] == 3 and bgr2rgb
	        if needs_swap:
	            # float64 input is narrowed to float32 before the OpenCV colour conversion.
	            if array.dtype == 'float64':
	                array = array.astype('float32')
	            array = cv2.cvtColor(array, cv2.COLOR_BGR2RGB)
	        tensor = torch.from_numpy(array.transpose(2, 0, 1))
	        return tensor.float() if float32 else tensor

	    if not isinstance(imgs, list):
	        return _convert(imgs)
	    return [_convert(item) for item in imgs]

	def is_gray(img, threshold=10):
	    """Decide whether an image array is (close to) grayscale.

	    Args:
	        img (ndarray): Image array accepted by ``PIL.Image.fromarray``.
	        threshold (float): Upper bound on the mean variance of the pairwise
	            channel differences for the image to count as gray.

	    Returns:
	        bool: True for single-band images, or when the mean variance of the
	            differences between the first three channels is at most `threshold`.
	    """
	    pil_img = Image.fromarray(img)
	    if len(pil_img.getbands()) == 1:
	        return True

	    # int16 keeps the channel differences signed instead of wrapping around.
	    first, second, third = (
	        np.asarray(pil_img.getchannel(channel=idx), dtype=np.int16) for idx in range(3)
	    )
	    var_12 = (first - second).var()
	    var_23 = (second - third).var()
	    var_31 = (third - first).var()
	    mean_var = (var_12 + var_23 + var_31) / 3.0
	    return bool(mean_var <= threshold)

	def rgb2gray(img, out_channel=3):
	    """Convert an (h, w, c) image with channels ordered R, G, B to grayscale.

	    Args:
	        img (ndarray): Image indexed as [row, col, channel]; channels 0, 1, 2
	            are read as red, green and blue.
	        out_channel (int): When 3, the gray plane is repeated into 3 channels;
	            any other value returns the 2D gray plane.

	    Returns:
	        ndarray: Weighted sum 0.2989 R + 0.5870 G + 0.1140 B.
	    """
	    red, green, blue = (img[:, :, idx] for idx in range(3))
	    luma = 0.2989 * red + 0.5870 * green + 0.1140 * blue
	    if out_channel != 3:
	        return luma
	    return luma[:, :, np.newaxis].repeat(3, axis=2)

	def bgr2gray(img, out_channel=3):
	b, g, r = img[:,:,0], img[:,:,1], img[:,:,2]
	gray = 0.2989 * r + 0.5870 * g + 0.1140 * b
	if out_channel == 3:
	gray = gray[:,:,np.newaxis].repeat(3, axis=2)
	return gray

	def calc_mean_std(feat, eps=1e-5):
	    """Compute the per-channel mean and standard deviation of a 3D array.

	    Args:
	        feat (ndarray): 3D array whose last axis is the channel axis.
	        eps (float): Added to the variance before the square root to avoid a
	            zero standard deviation.

	    Returns:
	        tuple[ndarray, ndarray]: Mean and standard deviation, each reshaped to
	            (1, 1, c).
	    """
	    shape = feat.shape
	    assert len(shape) == 3, 'The input feature should be 3D tensor.'
	    channels = shape[2]
	    flat = feat.reshape(-1, channels)  # one row per spatial position
	    std = np.sqrt(flat.var(axis=0) + eps).reshape(1, 1, channels)
	    mean = flat.mean(axis=0).reshape(1, 1, channels)
	    return mean, std


	def adain_npy(content_feat, style_feat):
	    """Adaptive instance normalization on numpy arrays.

	    The content feature is normalized with its own per-channel statistics and
	    then rescaled and shifted with the statistics of the style feature.

	    Args:
	        content_feat (ndarray): The input feature.
	        style_feat (ndarray): The reference feature.

	    Returns:
	        ndarray: Array with the shape of `content_feat`.
	    """
	    shape = content_feat.shape
	    style_mean, style_std = calc_mean_std(style_feat)
	    content_mean, content_std = calc_mean_std(content_feat)
	    centered = content_feat - np.broadcast_to(content_mean, shape)
	    whitened = centered / np.broadcast_to(content_std, shape)
	    rescaled = whitened * np.broadcast_to(style_std, shape)
	    return rescaled + np.broadcast_to(style_mean, shape)

	def xyxy2xywh(x):
	    """Convert nx4 boxes from [x1, y1, x2, y2] to [x_center, y_center, w, h].

	    (x1, y1) is the top-left corner and (x2, y2) the bottom-right corner.

	    Args:
	        x (Tensor | ndarray): Boxes indexed as [box, coordinate].

	    Returns:
	        Tensor | ndarray: Converted copy; the input is left unmodified.
	    """
	    out = x.clone() if isinstance(x, torch.Tensor) else np.copy(x)
	    left, top, right, bottom = x[:, 0], x[:, 1], x[:, 2], x[:, 3]
	    out[:, 0] = (left + right) / 2  # x center
	    out[:, 1] = (top + bottom) / 2  # y center
	    out[:, 2] = right - left  # width
	    out[:, 3] = bottom - top  # height
	    return out


	def xywh2xyxy(x):
	    """Convert nx4 boxes from [x_center, y_center, w, h] to [x1, y1, x2, y2].

	    (x1, y1) is the top-left corner and (x2, y2) the bottom-right corner.

	    Args:
	        x (Tensor | ndarray): Boxes indexed as [box, coordinate].

	    Returns:
	        Tensor | ndarray: Converted copy; the input is left unmodified.
	    """
	    out = x.clone() if isinstance(x, torch.Tensor) else np.copy(x)
	    center_x, center_y = x[:, 0], x[:, 1]
	    width, height = x[:, 2], x[:, 3]
	    out[:, 0] = center_x - width / 2  # top left x
	    out[:, 1] = center_y - height / 2  # top left y
	    out[:, 2] = center_x + width / 2  # bottom right x
	    out[:, 3] = center_y + height / 2  # bottom right y
	    return out


	def xywhn2xyxy(x, w=640, h=640, padw=32, padh=32):
	    """Convert nx4 normalized [x_center, y_center, w, h] boxes to [x1, y1, x2, y2].

	    Normalized coordinates are scaled by `w` / `h` and then shifted by the
	    padding. (x1, y1) is the top-left corner, (x2, y2) the bottom-right corner.

	    Args:
	        x (Tensor | ndarray): Normalized boxes indexed as [box, coordinate].
	        w (float): Horizontal scale factor.
	        h (float): Vertical scale factor.
	        padw (float): Offset added to the x coordinates.
	        padh (float): Offset added to the y coordinates.

	    Returns:
	        Tensor | ndarray: Converted copy; the input is left unmodified.
	    """
	    out = x.clone() if isinstance(x, torch.Tensor) else np.copy(x)
	    center_x, center_y = x[:, 0], x[:, 1]
	    box_w, box_h = x[:, 2], x[:, 3]
	    out[:, 0] = w * (center_x - box_w / 2) + padw  # top left x
	    out[:, 1] = h * (center_y - box_h / 2) + padh  # top left y
	    out[:, 2] = w * (center_x + box_w / 2) + padw  # bottom right x
	    out[:, 3] = h * (center_y + box_h / 2) + padh  # bottom right y
	    return out


	def scale_coords(img1_shape, coords, img0_shape, ratio_pad=None):
	    """Rescale xyxy boxes from `img1_shape` back to `img0_shape`, in place.

	    Args:
	        img1_shape (sequence): (height, width) the coordinates currently refer to.
	        coords (Tensor): Boxes whose first four columns are x1, y1, x2, y2;
	            modified in place.
	        img0_shape (sequence): (height, width) of the target image.
	        ratio_pad (sequence | None): Optional ((gain, ...), (pad_x, pad_y)); when
	            None, gain and padding are derived from the two shapes.

	    Returns:
	        Tensor: The same `coords` object, rescaled and clipped to `img0_shape`.
	    """
	    if ratio_pad is not None:
	        gain = ratio_pad[0][0]
	        pad = ratio_pad[1]
	    else:
	        # gain = old / new; the smaller ratio is the one that was used to fit the image
	        gain = min(img1_shape[0] / img0_shape[0], img1_shape[1] / img0_shape[1])
	        pad_x = (img1_shape[1] - img0_shape[1] * gain) / 2
	        pad_y = (img1_shape[0] - img0_shape[0] * gain) / 2
	        pad = pad_x, pad_y  # wh padding

	    coords[:, [0, 2]] -= pad[0]  # remove x padding
	    coords[:, [1, 3]] -= pad[1]  # remove y padding
	    coords[:, :4] /= gain
	    clip_coords(coords, img0_shape)
	    return coords


	def clip_coords(boxes, img_shape):
	    """Clip xyxy boxes in place to the bounds of an image.

	    Args:
	        boxes (Tensor): Boxes whose first four columns are x1, y1, x2, y2;
	            clamped in place via ``clamp_``.
	        img_shape (sequence): Image shape as (height, width).
	    """
	    height, width = img_shape[0], img_shape[1]
	    # Even columns hold x values (bounded by width), odd columns y values (height).
	    for col in range(4):
	        upper = width if col % 2 == 0 else height
	        boxes[:, col].clamp_(0, upper)

	def box_iou(box1, box2):
	    """Return the pairwise intersection-over-union (Jaccard index) of two box sets.

	    Adapted from https://github.com/pytorch/vision/blob/master/torchvision/ops/boxes.py
	    Both sets of boxes are expected to be in (x1, y1, x2, y2) format.

	    Args:
	        box1 (Tensor[N, 4]): First set of boxes.
	        box2 (Tensor[M, 4]): Second set of boxes.

	    Returns:
	        Tensor[N, M]: IoU value for every pair (box1[i], box2[j]).
	    """

	    def _area(boxes):
	        # width * height for every row
	        return (boxes[:, 2] - boxes[:, 0]) * (boxes[:, 3] - boxes[:, 1])

	    area_a = _area(box1)
	    area_b = _area(box2)

	    # Broadcasting box1 as (N, 1, 2) against box2 (M, 2) yields every pair (N, M, 2).
	    bottom_right = torch.min(box1[:, None, 2:], box2[:, 2:])
	    top_left = torch.max(box1[:, None, :2], box2[:, :2])
	    overlap = (bottom_right - top_left).clamp(0).prod(2)
	    # iou = inter / (area1 + area2 - inter)
	    return overlap / (area_a[:, None] + area_b - overlap)


	def wh_iou(wh1, wh2):
	    """Return the nxm IoU matrix of width-height pairs.

	    The overlap of a pair is the product of the element-wise minimum of the
	    two (w, h) pairs.

	    Args:
	        wh1 (Tensor): nx2 widths and heights.
	        wh2 (Tensor): mx2 widths and heights.

	    Returns:
	        Tensor: nxm matrix of IoU values.
	    """
	    first = wh1[:, None]  # [N,1,2]
	    second = wh2[None]  # [1,M,2]
	    overlap = torch.min(first, second).prod(2)  # [N,M]
	    union = first.prod(2) + second.prod(2) - overlap
	    return overlap / union

	def non_max_suppression_face(prediction, conf_thres=0.25, iou_thres=0.45, classes=None, agnostic=False, labels=()):
	    """Run non-maximum suppression (NMS) on face-detector predictions.

	    Each prediction row is read as 4 box values (center x, center y, width,
	    height), 1 objectness score, 10 landmark values and ``nc`` class scores,
	    where ``nc = prediction.shape[2] - 15``.

	    Args:
	        prediction (Tensor): Predictions indexed as [image, candidate, 15 + nc].
	        conf_thres (float): Minimum objectness and minimum final confidence for a
	            candidate to be kept.
	        iou_thres (float): IoU threshold passed to ``torchvision.ops.nms``.
	        classes (list[int] | None): If given, keep only detections whose class
	            index is in this list.
	        agnostic (bool): If True, boxes of different classes suppress each other.
	        labels (sequence): Optional per-image a-priori labels whose rows are
	            (class, x, y, w, h); they are appended as candidates with confidence 1.

	    Returns:
	        list[Tensor]: One tensor per image with shape (n, 16):
	            (x1, y1, x2, y2, conf, 10 landmark values, cls). Images that are not
	            reached before the time limit keep an empty (0, 16) tensor.
	    """
	    nc = prediction.shape[2] - 15  # number of classes
	    xc = prediction[..., 4] > conf_thres  # candidates

	    # Settings
	    max_wh = 4096  # (pixels) per-class box offset used to keep classes apart in NMS
	    time_limit = 10.0  # seconds to quit after
	    redundant = True  # require redundant detections
	    multi_label = nc > 1  # multiple labels per box (adds 0.5ms/img)
	    merge = False  # use merge-NMS

	    t = time.time()
	    # One independent empty tensor per image, so results never alias each other.
	    output = [torch.zeros((0, 16), device=prediction.device) for _ in range(prediction.shape[0])]
	    for xi, x in enumerate(prediction):  # image index, image inference
	        x = x[xc[xi]]  # keep confident candidates (boolean indexing returns a copy)

	        # Cat apriori labels if autolabelling
	        if labels and len(labels[xi]):
	            lab = labels[xi]
	            v = torch.zeros((len(lab), nc + 15), device=x.device)
	            v[:, :4] = lab[:, 1:5]  # box
	            v[:, 4] = 1.0  # conf
	            v[range(len(lab)), lab[:, 0].long() + 15] = 1.0  # cls
	            x = torch.cat((x, v), 0)

	        # If none remain process next image
	        if not x.shape[0]:
	            continue

	        # Compute conf: conf = obj_conf * cls_conf. Plain assignment here would
	        # discard the class scores and make every class equal to the objectness.
	        x[:, 15:] *= x[:, 4:5]

	        # Box (center x, center y, width, height) to (x1, y1, x2, y2)
	        box = xywh2xyxy(x[:, :4])

	        # Detections matrix nx16 (xyxy, conf, landmarks, cls)
	        if multi_label:
	            i, j = (x[:, 15:] > conf_thres).nonzero(as_tuple=False).T
	            x = torch.cat((box[i], x[i, j + 15, None], x[i, 5:15], j[:, None].float()), 1)
	        else:  # best class only
	            conf, j = x[:, 15:].max(1, keepdim=True)
	            x = torch.cat((box, conf, x[:, 5:15], j.float()), 1)[conf.view(-1) > conf_thres]

	        # Filter by class: the class index lives in column 15 of the detections
	        # matrix (columns 5..14 hold landmark values).
	        if classes is not None:
	            x = x[(x[:, 15:16] == torch.tensor(classes, device=x.device)).any(1)]

	        # If none remain process next image
	        n = x.shape[0]  # number of boxes
	        if not n:
	            continue

	        # Batched NMS: shifting boxes by class * max_wh keeps classes from overlapping
	        c = x[:, 15:16] * (0 if agnostic else max_wh)  # classes
	        boxes, scores = x[:, :4] + c, x[:, 4]  # boxes (offset by class), scores
	        i = torchvision.ops.nms(boxes, scores, iou_thres)  # NMS
	        if merge and (1 < n < 3E3):  # Merge NMS (boxes merged using weighted mean)
	            # update boxes as boxes(i,4) = weights(i,n) * boxes(n,4)
	            iou = box_iou(boxes[i], boxes) > iou_thres  # iou matrix
	            weights = iou * scores[None]  # box weights
	            x[i, :4] = torch.mm(weights, x[:, :4]).float() / weights.sum(1, keepdim=True)  # merged boxes
	            if redundant:
	                i = i[iou.sum(1) > 1]  # require redundancy

	        output[xi] = x[i]
	        if (time.time() - t) > time_limit:
	            break  # time limit exceeded

	    return output

	def scale_coords_landmarks(img1_shape, coords, img0_shape, ratio_pad=None):
	    """Rescale five (x, y) landmark pairs from `img1_shape` to `img0_shape`, in place.

	    Args:
	        img1_shape (sequence): (height, width) the coordinates currently refer to.
	        coords (Tensor): Rows whose first ten columns are x1, y1, ..., x5, y5;
	            modified in place.
	        img0_shape (sequence): (height, width) of the target image.
	        ratio_pad (sequence | None): Optional ((gain, ...), (pad_x, pad_y)); when
	            None, gain and padding are derived from the two shapes.

	    Returns:
	        Tensor: The same `coords` object, rescaled and clamped to `img0_shape`.
	    """
	    if ratio_pad is not None:
	        gain = ratio_pad[0][0]
	        pad = ratio_pad[1]
	    else:
	        # gain = old / new
	        gain = min(img1_shape[0] / img0_shape[0], img1_shape[1] / img0_shape[1])
	        pad_x = (img1_shape[1] - img0_shape[1] * gain) / 2
	        pad_y = (img1_shape[0] - img0_shape[0] * gain) / 2
	        pad = pad_x, pad_y  # wh padding

	    x_cols = [0, 2, 4, 6, 8]
	    y_cols = [1, 3, 5, 7, 9]
	    coords[:, x_cols] -= pad[0]  # remove x padding
	    coords[:, y_cols] -= pad[1]  # remove y padding
	    coords[:, :10] /= gain

	    # Even columns are x values (bounded by width), odd columns y values (height).
	    for col in range(10):
	        upper = img0_shape[1] if col % 2 == 0 else img0_shape[0]
	        coords[:, col].clamp_(0, upper)
	    return coords

	def letterbox(img, new_shape=(640, 640), color=(114, 114, 114), auto=False, scaleFill=False, scaleup=True):
	    """Resize an image to fit `new_shape` and pad the remainder with a constant border.

	    See https://github.com/ultralytics/yolov3/issues/232

	    Args:
	        img (ndarray): Image whose first two dimensions are (height, width).
	        new_shape (int | sequence): Target (height, width); an int is used for both.
	        color (tuple): Border value passed to ``cv2.copyMakeBorder``.
	        auto (bool): Reduce the padding modulo 64 (minimum rectangle).
	        scaleFill (bool): Stretch to `new_shape` without padding; only
	            considered when `auto` is False.
	        scaleup (bool): When False, the image is only ever scaled down.

	    Returns:
	        tuple: (padded image, (width ratio, height ratio), (dw, dh)) where dw and
	            dh are the padding applied per side.
	    """
	    src_hw = img.shape[:2]  # current shape [height, width]
	    if isinstance(new_shape, int):
	        new_shape = (new_shape, new_shape)
	    target_h, target_w = new_shape[0], new_shape[1]

	    # Scale ratio (new / old)
	    scale = min(target_h / src_hw[0], target_w / src_hw[1])
	    if not scaleup:  # only scale down, do not scale up (for better test mAP)
	        scale = min(scale, 1.0)

	    # Compute padding
	    ratio = scale, scale  # width, height ratios
	    new_unpad = int(round(src_hw[1] * scale)), int(round(src_hw[0] * scale))
	    dw = target_w - new_unpad[0]  # total width padding
	    dh = target_h - new_unpad[1]  # total height padding
	    if auto:  # minimum rectangle
	        dw, dh = np.mod(dw, 64), np.mod(dh, 64)
	    elif scaleFill:  # stretch
	        dw, dh = 0.0, 0.0
	        new_unpad = (target_w, target_h)
	        ratio = target_w / src_hw[1], target_h / src_hw[0]  # width, height ratios

	    # divide padding into 2 sides
	    dw, dh = dw / 2, dh / 2

	    if src_hw[::-1] != new_unpad:  # resize
	        img = cv2.resize(img, new_unpad, interpolation=cv2.INTER_LINEAR)
	    # The -0.1 / +0.1 offsets split an odd total padding into floor and ceil halves.
	    top = int(round(dh - 0.1))
	    bottom = int(round(dh + 0.1))
	    left = int(round(dw - 0.1))
	    right = int(round(dw + 0.1))
	    img = cv2.copyMakeBorder(img, top, bottom, left, right, cv2.BORDER_CONSTANT, value=color)  # add border
	    return img, ratio, (dw, dh)