Spaces:

teemosliang
/

SDPose

Running on Zero

App Files Files Community

SDPose / mmpose /evaluation /functional /nms.py

teemosliang

realease: publish the huggingface space demo of SDPose

d5532b9 verified about 1 month ago

raw

history blame contribute delete

11.3 kB

	# Copyright (c) Meta Platforms, Inc. and affiliates.
	# All rights reserved.
	#
	# This source code is licensed under the license found in the
	# LICENSE file in the root directory of this source tree.

	# ------------------------------------------------------------------------------
	# Adapted from https://github.com/leoxiaobin/deep-high-resolution-net.pytorch
	# and https://github.com/HRNet/DEKR
	# Original licence: Copyright (c) Microsoft, under the MIT License.
	# ------------------------------------------------------------------------------

	from typing import List, Optional

	import numpy as np


	def nms(dets: np.ndarray, thr: float) -> List[int]:
	"""Greedily select boxes with high confidence and overlap <= thr.

	Args:
	dets (np.ndarray): [[x1, y1, x2, y2, score]].
	thr (float): Retain overlap < thr.

	Returns:
	list: Indexes to keep.
	"""
	if len(dets) == 0:
	return []

	x1 = dets[:, 0]
	y1 = dets[:, 1]
	x2 = dets[:, 2]
	y2 = dets[:, 3]
	scores = dets[:, 4]

	areas = (x2 - x1 + 1) * (y2 - y1 + 1)
	order = scores.argsort()[::-1]

	keep = []
	while len(order) > 0:
	i = order[0]
	keep.append(i)
	xx1 = np.maximum(x1[i], x1[order[1:]])
	yy1 = np.maximum(y1[i], y1[order[1:]])
	xx2 = np.minimum(x2[i], x2[order[1:]])
	yy2 = np.minimum(y2[i], y2[order[1:]])

	w = np.maximum(0.0, xx2 - xx1 + 1)
	h = np.maximum(0.0, yy2 - yy1 + 1)
	inter = w * h
	ovr = inter / (areas[i] + areas[order[1:]] - inter)

	inds = np.where(ovr <= thr)[0]
	order = order[inds + 1]

	return keep


	def oks_iou(g: np.ndarray,
	d: np.ndarray,
	a_g: float,
	a_d: np.ndarray,
	sigmas: Optional[np.ndarray] = None,
	vis_thr: Optional[float] = None) -> np.ndarray:
	"""Calculate oks ious.

	Note:

	- number of keypoints: K
	- number of instances: N

	Args:
	g (np.ndarray): The instance to calculate OKS IOU with other
	instances. Containing the keypoints coordinates. Shape: (K*3, )
	d (np.ndarray): The rest instances. Containing the keypoints
	coordinates. Shape: (N, K*3)
	a_g (float): Area of the ground truth object.
	a_d (np.ndarray): Area of the detected object. Shape: (N, )
	sigmas (np.ndarray, optional): Keypoint labelling uncertainty.
	Please refer to `COCO keypoint evaluation
	<https://cocodataset.org/#keypoints-eval>`__ for more details.
	If not given, use the sigmas on COCO dataset.
	If specified, shape: (K, ). Defaults to ``None``
	vis_thr(float, optional): Threshold of the keypoint visibility.
	If specified, will calculate OKS based on those keypoints whose
	visibility higher than vis_thr. If not given, calculate the OKS
	based on all keypoints. Defaults to ``None``

	Returns:
	np.ndarray: The oks ious.
	"""
	if sigmas is None:
	sigmas = np.array([
	.26, .25, .25, .35, .35, .79, .79, .72, .72, .62, .62, 1.07, 1.07,
	.87, .87, .89, .89
	]) / 10.0
	vars = (sigmas * 2)**2
	xg = g[0::3]
	yg = g[1::3]
	vg = g[2::3]
	ious = np.zeros(len(d), dtype=np.float32)
	for n_d in range(0, len(d)):
	xd = d[n_d, 0::3]
	yd = d[n_d, 1::3]
	vd = d[n_d, 2::3]
	dx = xd - xg
	dy = yd - yg
	e = (dx2 + dy2) / vars / ((a_g + a_d[n_d]) / 2 + np.spacing(1)) / 2
	if vis_thr is not None:
	ind = list((vg > vis_thr) & (vd > vis_thr))
	e = e[ind]
	ious[n_d] = np.sum(np.exp(-e)) / len(e) if len(e) != 0 else 0.0
	return ious


	def oks_nms(kpts_db: List[dict],
	thr: float,
	sigmas: Optional[np.ndarray] = None,
	vis_thr: Optional[float] = None,
	score_per_joint: bool = False):
	"""OKS NMS implementations.

	Args:
	kpts_db (List[dict]): The keypoints results of the same image.
	thr (float): The threshold of NMS. Will retain oks overlap < thr.
	sigmas (np.ndarray, optional): Keypoint labelling uncertainty.
	Please refer to `COCO keypoint evaluation
	<https://cocodataset.org/#keypoints-eval>`__ for more details.
	If not given, use the sigmas on COCO dataset. Defaults to ``None``
	vis_thr(float, optional): Threshold of the keypoint visibility.
	If specified, will calculate OKS based on those keypoints whose
	visibility higher than vis_thr. If not given, calculate the OKS
	based on all keypoints. Defaults to ``None``
	score_per_joint(bool): Whether the input scores (in kpts_db) are
	per-joint scores. Defaults to ``False``

	Returns:
	np.ndarray: indexes to keep.
	"""
	if len(kpts_db) == 0:
	return []

	if score_per_joint:
	scores = np.array([k['score'].mean() for k in kpts_db])
	else:
	scores = np.array([k['score'] for k in kpts_db])

	kpts = np.array([k['keypoints'].flatten() for k in kpts_db])
	areas = np.array([k['area'] for k in kpts_db])

	order = scores.argsort()[::-1]

	keep = []
	while len(order) > 0:
	i = order[0]
	keep.append(i)

	oks_ovr = oks_iou(kpts[i], kpts[order[1:]], areas[i], areas[order[1:]],
	sigmas, vis_thr)

	inds = np.where(oks_ovr <= thr)[0]
	order = order[inds + 1]

	keep = np.array(keep)

	return keep


	def _rescore(overlap: np.ndarray,
	scores: np.ndarray,
	thr: float,
	type: str = 'gaussian'):
	"""Rescoring mechanism gaussian or linear.

	Args:
	overlap (np.ndarray): The calculated oks ious.
	scores (np.ndarray): target scores.
	thr (float): retain oks overlap < thr.
	type (str): The rescoring type. Could be 'gaussian' or 'linear'.
	Defaults to ``'gaussian'``

	Returns:
	np.ndarray: indexes to keep
	"""
	assert len(overlap) == len(scores)
	assert type in ['gaussian', 'linear']

	if type == 'linear':
	inds = np.where(overlap >= thr)[0]
	scores[inds] = scores[inds] * (1 - overlap[inds])
	else:
	scores = scores * np.exp(-overlap**2 / thr)

	return scores


	def soft_oks_nms(kpts_db: List[dict],
	thr: float,
	max_dets: int = 20,
	sigmas: Optional[np.ndarray] = None,
	vis_thr: Optional[float] = None,
	score_per_joint: bool = False):
	"""Soft OKS NMS implementations.

	Args:
	kpts_db (List[dict]): The keypoints results of the same image.
	thr (float): The threshold of NMS. Will retain oks overlap < thr.
	max_dets (int): Maximum number of detections to keep. Defaults to 20
	sigmas (np.ndarray, optional): Keypoint labelling uncertainty.
	Please refer to `COCO keypoint evaluation
	<https://cocodataset.org/#keypoints-eval>`__ for more details.
	If not given, use the sigmas on COCO dataset. Defaults to ``None``
	vis_thr(float, optional): Threshold of the keypoint visibility.
	If specified, will calculate OKS based on those keypoints whose
	visibility higher than vis_thr. If not given, calculate the OKS
	based on all keypoints. Defaults to ``None``
	score_per_joint(bool): Whether the input scores (in kpts_db) are
	per-joint scores. Defaults to ``False``

	Returns:
	np.ndarray: indexes to keep.
	"""
	if len(kpts_db) == 0:
	return []

	if score_per_joint:
	scores = np.array([k['score'].mean() for k in kpts_db])
	else:
	scores = np.array([k['score'] for k in kpts_db])

	kpts = np.array([k['keypoints'].flatten() for k in kpts_db])
	areas = np.array([k['area'] for k in kpts_db])

	order = scores.argsort()[::-1]
	scores = scores[order]

	keep = np.zeros(max_dets, dtype=np.intp)
	keep_cnt = 0
	while len(order) > 0 and keep_cnt < max_dets:
	i = order[0]

	oks_ovr = oks_iou(kpts[i], kpts[order[1:]], areas[i], areas[order[1:]],
	sigmas, vis_thr)

	order = order[1:]
	scores = _rescore(oks_ovr, scores[1:], thr)

	tmp = scores.argsort()[::-1]
	order = order[tmp]
	scores = scores[tmp]

	keep[keep_cnt] = i
	keep_cnt += 1

	keep = keep[:keep_cnt]

	return keep


	def nearby_joints_nms(
	kpts_db: List[dict],
	dist_thr: float,
	num_nearby_joints_thr: Optional[int] = None,
	score_per_joint: bool = False,
	max_dets: int = 30,
	):
	"""Nearby joints NMS implementations. Instances with non-maximum scores
	will be suppressed if they have too much closed joints with other
	instances. This function is modified from project
	`DEKR<https://github.com/HRNet/DEKR/blob/main/lib/core/nms.py>`.

	Args:
	kpts_db (list[dict]): keypoints and scores.
	dist_thr (float): threshold for judging whether two joints are close.
	num_nearby_joints_thr (int): threshold for judging whether two
	instances are close.
	max_dets (int): max number of detections to keep.
	score_per_joint (bool): the input scores (in kpts_db) are per joint
	scores.

	Returns:
	np.ndarray: indexes to keep.
	"""

	assert dist_thr > 0, '`dist_thr` must be greater than 0.'
	if len(kpts_db) == 0:
	return []

	if score_per_joint:
	scores = np.array([k['score'].mean() for k in kpts_db])
	else:
	scores = np.array([k['score'] for k in kpts_db])

	kpts = np.array([k['keypoints'] for k in kpts_db])

	num_people, num_joints, _ = kpts.shape
	if num_nearby_joints_thr is None:
	num_nearby_joints_thr = num_joints // 2
	assert num_nearby_joints_thr < num_joints, '`num_nearby_joints_thr` must '\
	'be less than the number of joints.'

	# compute distance threshold
	pose_area = kpts.max(axis=1) - kpts.min(axis=1)
	pose_area = np.sqrt(np.power(pose_area, 2).sum(axis=1))
	pose_area = pose_area.reshape(num_people, 1, 1)
	pose_area = np.tile(pose_area, (num_people, num_joints))
	close_dist_thr = pose_area * dist_thr

	# count nearby joints between instances
	instance_dist = kpts[:, None] - kpts
	instance_dist = np.sqrt(np.power(instance_dist, 2).sum(axis=3))
	close_instance_num = (instance_dist < close_dist_thr).sum(2)
	close_instance = close_instance_num > num_nearby_joints_thr

	# apply nms
	ignored_pose_inds, keep_pose_inds = set(), list()
	indexes = np.argsort(scores)[::-1]
	for i in indexes:
	if i in ignored_pose_inds:
	continue
	keep_inds = close_instance[i].nonzero()[0]
	keep_ind = keep_inds[np.argmax(scores[keep_inds])]
	if keep_ind not in ignored_pose_inds:
	keep_pose_inds.append(keep_ind)
	ignored_pose_inds = ignored_pose_inds.union(set(keep_inds))

	# limit the number of output instances
	if max_dets > 0 and len(keep_pose_inds) > max_dets:
	sub_inds = np.argsort(scores[keep_pose_inds])[-1:-max_dets - 1:-1]
	keep_pose_inds = [keep_pose_inds[i] for i in sub_inds]

	return keep_pose_inds