open-mmlab · LareinaM · Feb 17, 2023 · Feb 22, 2023 · Mar 8, 2023 · Mar 8, 2023
@@ -48,3 +48,4 @@ Metrics
    ConnectivityError
    DOTAMeanAP
    ROUGE
+   COCOKeyPointDetection
@@ -48,3 +48,4 @@ Metrics
    ConnectivityError
    DOTAMeanAP
    ROUGE
+   COCOKeyPointDetection
@@ -6,6 +6,7 @@
 from .ava_map import AVAMeanAP
 from .bleu import BLEU
 from .coco_detection import COCODetection
+from .coco_pose import COCOKeyPointDetection
 from .connectivity_error import ConnectivityError
 from .dota_map import DOTAMeanAP
 from .end_point_error import EndPointError
@@ -36,7 +37,7 @@
     'StructuralSimilarity', 'SignalNoiseRatio', 'MultiLabelMetric',
     'AveragePrecision', 'AVAMeanAP', 'BLEU', 'DOTAMeanAP',
     'SumAbsoluteDifferences', 'GradientError', 'MattingMeanSquaredError',
-    'ConnectivityError', 'ROUGE'
+    'ConnectivityError', 'ROUGE', 'COCOKeyPointDetection'
 ]
 
 _deprecated_msg = (
@@ -46,6 +47,7 @@
 
 __deprecated_metric_names__ = {
     'COCODetectionMetric': 'COCODetection',
+    'COCOPoseMetric': 'COCOKeyPointDetection',
     'F1Metric': 'F1Score',
     'MAE': 'MeanAbsoluteError',
     'MSE': 'MeanSquaredError',

@@ -5,6 +5,7 @@
 from .grammar import get_n_gram, get_tokenizer, infer_language
 from .image_transforms import reorder_and_crop
 from .keypoint import calc_distances, distance_acc
+from .nms import nms, oks_nms, soft_oks_nms
 from .polygon import (poly2shapely, poly_intersection, poly_iou,
                       poly_make_valid, poly_union, polys2shapely)
 
@@ -13,5 +14,6 @@
     'poly_make_valid', 'poly_iou', 'calc_distances', 'distance_acc',
     'calculate_overlaps', 'calculate_bboxes_area', 'reorder_and_crop',
     'calculate_bboxes_area_rotated', 'calculate_overlaps_rotated',
-    'get_n_gram', 'get_tokenizer', 'infer_language'
+    'get_n_gram', 'get_tokenizer', 'infer_language', 'nms', 'oks_nms',
+    'soft_oks_nms'
 ]
@@ -0,0 +1,250 @@
+# ------------------------------------------------------------------------------
+# Adapted from https://github.com/leoxiaobin/deep-high-resolution-net.pytorch
+# Original licence: Copyright (c) Microsoft, under the MIT License.
+# ------------------------------------------------------------------------------
+
+import numpy as np
+from typing import List, Optional
+
+
+def nms(dets: np.ndarray, thr: float) -> List[int]:
+    """Greedily select boxes with high confidence and overlap <= thr.
+
+    Args:
+        dets (np.ndarray): [[x1, y1, x2, y2, score]].
+        thr (float): Retain overlap < thr.
+
+    Returns:
+        list: Indexes to keep.
+    """
+    if len(dets) == 0:
+        return []
+
+    x1 = dets[:, 0]
+    y1 = dets[:, 1]
+    x2 = dets[:, 2]
+    y2 = dets[:, 3]
+    scores = dets[:, 4]
+
+    areas = (x2 - x1 + 1) * (y2 - y1 + 1)
+    order = scores.argsort()[::-1]
+
+    keep = []
+    while len(order) > 0:
+        i = order[0]
+        keep.append(i)
+        xx1 = np.maximum(x1[i], x1[order[1:]])
+        yy1 = np.maximum(y1[i], y1[order[1:]])
+        xx2 = np.minimum(x2[i], x2[order[1:]])
+        yy2 = np.minimum(y2[i], y2[order[1:]])
+
+        w = np.maximum(0.0, xx2 - xx1 + 1)
+        h = np.maximum(0.0, yy2 - yy1 + 1)
+        inter = w * h
+        ovr = inter / (areas[i] + areas[order[1:]] - inter)
+
+        inds = np.where(ovr <= thr)[0]
+        order = order[inds + 1]
+
+    return keep
+
+
+def oks_iou(g: np.ndarray,
+            d: np.ndarray,
+            a_g: float,
+            a_d: np.ndarray,
+            sigmas: Optional[np.ndarray] = None,
+            vis_thr: Optional[float] = None) -> np.ndarray:
+    """Calculate oks ious.
+
+    Note:
+
+        - number of keypoints: K
+        - number of instances: N
+
+    Args:
+        g (np.ndarray): The instance to calculate OKS IOU with other
+            instances. Containing the keypoints coordinates. Shape: (K*3, )
+        d (np.ndarray): The rest instances. Containing the keypoints
+            coordinates. Shape: (N, K*3)
+        a_g (float): Area of the ground truth object.
+        a_d (np.ndarray): Area of the detected object. Shape: (N, )
+        sigmas (np.ndarray, optional): Keypoint labelling uncertainty.
+            Please refer to `COCO keypoint evaluation
+            <https://cocodataset.org/#keypoints-eval>`__ for more details.
+            If not given, use the sigmas on COCO dataset.
+            If specified, shape: (K, ). Defaults to ``None``
+        vis_thr(float, optional): Threshold of the keypoint visibility.
+            If specified, will calculate OKS based on those keypoints whose
+            visibility higher than vis_thr. If not given, calculate the OKS
+            based on all keypoints. Defaults to ``None``
+
+    Returns:
+        np.ndarray: The oks ious.
+    """
+    if sigmas is None:
+        sigmas = np.array([
+            .26, .25, .25, .35, .35, .79, .79, .72, .72, .62, .62, 1.07, 1.07,
+            .87, .87, .89, .89
+        ]) / 10.0
+    vars = (sigmas * 2)**2
+    xg = g[0::3]
+    yg = g[1::3]
+    vg = g[2::3]
+    ious = np.zeros(len(d), dtype=np.float32)
+    for n_d in range(0, len(d)):
+        xd = d[n_d, 0::3]
+        yd = d[n_d, 1::3]
+        vd = d[n_d, 2::3]
+        dx = xd - xg
+        dy = yd - yg
+        e = (dx**2 + dy**2) / vars / ((a_g + a_d[n_d]) / 2 + np.spacing(1)) / 2
+        if vis_thr is not None:
+            ind = list(vg > vis_thr) and list(vd > vis_thr)
+            e = e[ind]
+        ious[n_d] = np.sum(np.exp(-e)) / len(e) if len(e) != 0 else 0.0
+    return ious
+
+
+def oks_nms(kpts_db: List[dict],
+            thr: float,
+            sigmas: Optional[np.ndarray] = None,
+            vis_thr: Optional[float] = None,
+            score_per_joint: bool = False) -> np.ndarray:
+    """OKS NMS implementations.
+
+    Args:
+        kpts_db (List[dict]): The keypoints results of the same image.
+        thr (float): The threshold of NMS. Will retain oks overlap < thr.
+        sigmas (np.ndarray, optional): Keypoint labelling uncertainty.
+            Please refer to `COCO keypoint evaluation
+            <https://cocodataset.org/#keypoints-eval>`__ for more details.
+            If not given, use the sigmas on COCO dataset. Defaults to ``None``
+        vis_thr(float, optional): Threshold of the keypoint visibility.
+            If specified, will calculate OKS based on those keypoints whose
+            visibility higher than vis_thr. If not given, calculate the OKS
+            based on all keypoints. Defaults to ``None``
+        score_per_joint(bool): Whether the input scores (in kpts_db) are
+            per-joint scores. Defaults to ``False``
+
+    Returns:
+        np.ndarray: indexes to keep.
+    """
+    if len(kpts_db) == 0:
+        return []
+
+    if score_per_joint:
+        scores = np.array([k['score'].mean() for k in kpts_db])
+    else:
+        scores = np.array([k['score'] for k in kpts_db])
+
+    kpts = np.array([k['keypoints'].flatten() for k in kpts_db])
+    areas = np.array([k['area'] for k in kpts_db])
+
+    order = scores.argsort()[::-1]
+
+    keep = []
+    while len(order) > 0:
+        i = order[0]
+        keep.append(i)
+
+        oks_ovr = oks_iou(kpts[i], kpts[order[1:]], areas[i], areas[order[1:]],
+                          sigmas, vis_thr)
+
+        inds = np.where(oks_ovr <= thr)[0]
+        order = order[inds + 1]
+
+    keep = np.array(keep)
+
+    return keep
+
+
+def _rescore(overlap: np.ndarray,
+             scores: np.ndarray,
+             thr: float,
+             type: str = 'gaussian') -> np.ndarray:
+    """Rescoring mechanism gaussian or linear.
+
+    Args:
+        overlap (np.ndarray): The calculated oks ious.
+        scores (np.ndarray): target scores.
+        thr (float): retain oks overlap < thr.
+        type (str): The rescoring type. Could be 'gaussian' or 'linear'.
+            Defaults to ``'gaussian'``
+
+    Returns:
+        np.ndarray: indexes to keep
+    """
+    assert len(overlap) == len(scores)
+    assert type in ['gaussian', 'linear']
+
+    if type == 'linear':
+        inds = np.where(overlap >= thr)[0]
+        scores[inds] = scores[inds] * (1 - overlap[inds])
+    else:
+        scores = scores * np.exp(-overlap**2 / thr)
+
+    return scores
+
+
+def soft_oks_nms(kpts_db: List[dict],
+                 thr: float,
+                 max_dets: int = 20,
+                 sigmas: Optional[np.ndarray] = None,
+                 vis_thr: Optional[float] = None,
+                 score_per_joint: bool = False) -> np.ndarray:
+    """Soft OKS NMS implementations.
+
+    Args:
+        kpts_db (List[dict]): The keypoints results of the same image.
+        thr (float): The threshold of NMS. Will retain oks overlap < thr.
+        max_dets (int): Maximum number of detections to keep. Defaults to 20
+        sigmas (np.ndarray, optional): Keypoint labelling uncertainty.
+            Please refer to `COCO keypoint evaluation
+            <https://cocodataset.org/#keypoints-eval>`__ for more details.
+            If not given, use the sigmas on COCO dataset. Defaults to ``None``
+        vis_thr(float, optional): Threshold of the keypoint visibility.
+            If specified, will calculate OKS based on those keypoints whose
+            visibility higher than vis_thr. If not given, calculate the OKS
+            based on all keypoints. Defaults to ``None``
+        score_per_joint(bool): Whether the input scores (in kpts_db) are
+            per-joint scores. Defaults to ``False``
+
+    Returns:
+        np.ndarray: indexes to keep.
+    """
+    if len(kpts_db) == 0:
+        return []
+
+    if score_per_joint:
+        scores = np.array([k['score'].mean() for k in kpts_db])
+    else:
+        scores = np.array([k['score'] for k in kpts_db])
+
+    kpts = np.array([k['keypoints'].flatten() for k in kpts_db])
+    areas = np.array([k['area'] for k in kpts_db])
+
+    order = scores.argsort()[::-1]
+    scores = scores[order]
+
+    keep = np.zeros(max_dets, dtype=np.intp)
+    keep_cnt = 0
+    while len(order) > 0 and keep_cnt < max_dets:
+        i = order[0]
+
+        oks_ovr = oks_iou(kpts[i], kpts[order[1:]], areas[i], areas[order[1:]],
+                          sigmas, vis_thr)
+
+        order = order[1:]
+        scores = _rescore(oks_ovr, scores[1:], thr)
+
+        tmp = scores.argsort()[::-1]
+        order = order[tmp]
+        scores = scores[tmp]
+
+        keep[keep_cnt] = i
+        keep_cnt += 1
+
+    keep = keep[:keep_cnt]
+
+    return keep