# Copyright (c) OpenMMLab. All rights reserved.
from unittest import TestCase

import numpy as np
from mmengine.structures import InstanceData

from mmpose.datasets.datasets.utils import parse_pose_metainfo
from mmpose.evaluation.metrics import (AUC, EPE, NME, JhmdbPCKAccuracy,
                                       MpiiPCKAccuracy, PCKAccuracy)


class TestPCKAccuracy(TestCase):

    def setUp(self):
        """Setup some variables which are used in every test method.

        TestCase calls functions in this order: setUp() -> testMethod() ->
        tearDown() -> doCleanups()
        """
        self.batch_size = 8
        num_keypoints = 15
        self.data_batch = []
        self.data_samples = []

        for i in range(self.batch_size):
            gt_instances = InstanceData()
            keypoints = np.zeros((1, num_keypoints, 2))
            keypoints[0, i] = [0.5 * i, 0.5 * i]
            gt_instances.keypoints = keypoints
            gt_instances.keypoints_visible = np.ones(
                (1, num_keypoints, 1)).astype(bool)
            gt_instances.keypoints_visible[0, (2 * i) % 8, 0] = False
            gt_instances.bboxes = np.random.random((1, 4)) * 20 * i
            gt_instances.head_size = np.random.random((1, 1)) * 10 * i
            # predictions equal the ground truth, so every accuracy
            # checked below is expected to be perfect
            pred_instances = InstanceData()
            pred_instances.keypoints = keypoints

            data = {'inputs': None}
            data_sample = {
                'gt_instances': gt_instances.to_dict(),
                'pred_instances': pred_instances.to_dict(),
            }

            self.data_batch.append(data)
            self.data_samples.append(data_sample)

    def test_init(self):
        """test metric init method."""
        # test invalid normalized_items
        with self.assertRaisesRegex(
                KeyError, "Should be one of 'bbox', 'head', 'torso'"):
            PCKAccuracy(norm_item='invalid')

    def test_evaluate(self):
        """test PCK accuracy evaluation metric."""
        # test normalized by 'bbox'
        pck_metric = PCKAccuracy(thr=0.5, norm_item='bbox')
        pck_metric.process(self.data_batch, self.data_samples)
        pck = pck_metric.evaluate(self.batch_size)
        target = {'PCK': 1.0}
        self.assertDictEqual(pck, target)

        # test normalized by 'head'
        pckh_metric = PCKAccuracy(thr=0.3, norm_item='head')
        pckh_metric.process(self.data_batch, self.data_samples)
        pckh = pckh_metric.evaluate(self.batch_size)
        target = {'PCKh': 1.0}
        self.assertDictEqual(pckh, target)

        # test normalized by both 'bbox' and 'torso'
        tpck_metric = PCKAccuracy(thr=0.05, norm_item=['bbox', 'torso'])
        tpck_metric.process(self.data_batch, self.data_samples)
        tpck = tpck_metric.evaluate(self.batch_size)
        self.assertIsInstance(tpck, dict)
        target = {
            'PCK': 1.0,
            'tPCK': 1.0,
        }
        self.assertDictEqual(tpck, target)
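

# ---------------------------------------------------------------------------
# For reference, a minimal sketch of the PCK computation exercised above
# (illustrative only; `_naive_pck` and its signature are not part of
# mmpose). A keypoint counts as correct when its distance to the ground
# truth, divided by a normalization factor (bbox size for 'bbox', head size
# for 'head', torso size for 'torso'), falls below `thr`.
# ---------------------------------------------------------------------------
def _naive_pck(pred, gt, mask, norm_factor, thr=0.5):
    """PCK sketch: pred/gt are (N, K, 2), mask is (N, K) bool,
    norm_factor is (N, 2)."""
    dist = np.linalg.norm((pred - gt) / norm_factor[:, None, :], axis=-1)
    return (dist[mask] < thr).mean()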


class TestMpiiPCKAccuracy(TestCase):

    def setUp(self):
        """Setup some variables which are used in every test method.

        TestCase calls functions in this order: setUp() -> testMethod() ->
        tearDown() -> doCleanups()
        """
        self.batch_size = 8
        num_keypoints = 16
        self.data_batch = []
        self.data_samples = []

        for i in range(self.batch_size):
            gt_instances = InstanceData()
            keypoints = np.zeros((1, num_keypoints, 2))
            keypoints[0, i] = [0.5 * i, 0.5 * i]
            # MPII annotations use the 1-based Matlab convention, so the
            # ground truth is shifted by +1.0 while the 0-based predictions
            # are left unchanged; the metric is expected to bridge the gap
            gt_instances.keypoints = keypoints + 1.0
            gt_instances.keypoints_visible = np.ones(
                (1, num_keypoints, 1)).astype(bool)
            gt_instances.keypoints_visible[0, (2 * i) % 8, 0] = False
            gt_instances.bboxes = np.random.random((1, 4)) * 20 * i
            gt_instances.head_size = np.random.random((1, 1)) * 10 * i
            pred_instances = InstanceData()
            pred_instances.keypoints = keypoints

            data = {'inputs': None}
            data_sample = {
                'gt_instances': gt_instances.to_dict(),
                'pred_instances': pred_instances.to_dict(),
            }

            self.data_batch.append(data)
            self.data_samples.append(data_sample)

    def test_init(self):
        """test metric init method."""
        # test invalid normalized_items
        with self.assertRaisesRegex(
                KeyError, "Should be one of 'bbox', 'head', 'torso'"):
            MpiiPCKAccuracy(norm_item='invalid')

    def test_evaluate(self):
        """test MPII PCK accuracy evaluation metric."""
        # test normalized by 'head'
        mpii_pck_metric = MpiiPCKAccuracy(thr=0.3, norm_item='head')
        mpii_pck_metric.process(self.data_batch, self.data_samples)
        pck_results = mpii_pck_metric.evaluate(self.batch_size)
        # MpiiPCKAccuracy reports percentages rather than ratios
        target = {
            'Head PCK': 100.0,
            'Shoulder PCK': 100.0,
            'Elbow PCK': 100.0,
            'Wrist PCK': 100.0,
            'Hip PCK': 100.0,
            'Knee PCK': 100.0,
            'Ankle PCK': 100.0,
            'PCK': 100.0,
            'PCK@0.1': 100.0,
        }
        self.assertDictEqual(pck_results, target)


class TestJhmdbPCKAccuracy(TestCase):

    def setUp(self):
        """Setup some variables which are used in every test method.

        TestCase calls functions in this order: setUp() -> testMethod() ->
        tearDown() -> doCleanups()
        """
        self.batch_size = 8
        num_keypoints = 15
        self.data_batch = []
        self.data_samples = []

        for i in range(self.batch_size):
            gt_instances = InstanceData()
            keypoints = np.zeros((1, num_keypoints, 2))
            keypoints[0, i] = [0.5 * i, 0.5 * i]
            gt_instances.keypoints = keypoints
            gt_instances.keypoints_visible = np.ones(
                (1, num_keypoints, 1)).astype(bool)
            gt_instances.keypoints_visible[0, (2 * i) % 8, 0] = False
            gt_instances.bboxes = np.random.random((1, 4)) * 20 * i
            gt_instances.head_size = np.random.random((1, 1)) * 10 * i
            pred_instances = InstanceData()
            pred_instances.keypoints = keypoints

            data = {'inputs': None}
            data_sample = {
                'gt_instances': gt_instances.to_dict(),
                'pred_instances': pred_instances.to_dict(),
            }

            self.data_batch.append(data)
            self.data_samples.append(data_sample)

    def test_init(self):
        """test metric init method."""
        # test invalid normalized_items
        with self.assertRaisesRegex(
                KeyError, "Should be one of 'bbox', 'head', 'torso'"):
            JhmdbPCKAccuracy(norm_item='invalid')

    def test_evaluate(self):
        """test JHMDB PCK accuracy evaluation metric."""
        # test normalized by 'bbox'
        jhmdb_pck_metric = JhmdbPCKAccuracy(thr=0.5, norm_item='bbox')
        jhmdb_pck_metric.process(self.data_batch, self.data_samples)
        pck_results = jhmdb_pck_metric.evaluate(self.batch_size)
        target = {
            'Head PCK': 1.0,
            'Sho PCK': 1.0,
            'Elb PCK': 1.0,
            'Wri PCK': 1.0,
            'Hip PCK': 1.0,
            'Knee PCK': 1.0,
            'Ank PCK': 1.0,
            'PCK': 1.0,
        }
        self.assertDictEqual(pck_results, target)

        # test normalized by 'torso'
        jhmdb_tpck_metric = JhmdbPCKAccuracy(thr=0.2, norm_item='torso')
        jhmdb_tpck_metric.process(self.data_batch, self.data_samples)
        tpck_results = jhmdb_tpck_metric.evaluate(self.batch_size)
        target = {
            'Head tPCK': 1.0,
            'Sho tPCK': 1.0,
            'Elb tPCK': 1.0,
            'Wri tPCK': 1.0,
            'Hip tPCK': 1.0,
            'Knee tPCK': 1.0,
            'Ank tPCK': 1.0,
            'tPCK': 1.0,
        }
        self.assertDictEqual(tpck_results, target)


class TestAUCandEPE(TestCase):

    def setUp(self):
        """Setup some variables which are used in every test method.

        TestCase calls functions in this order: setUp() -> testMethod() ->
        tearDown() -> doCleanups()
        """
        output = np.zeros((1, 5, 2))
        target = np.zeros((1, 5, 2))
        # first keypoint
        output[0, 0] = [10, 4]
        target[0, 0] = [10, 0]
        # second keypoint
        output[0, 1] = [10, 18]
        target[0, 1] = [10, 10]
        # third keypoint (masked as invisible below)
        output[0, 2] = [0, 0]
        target[0, 2] = [0, -1]
        # fourth keypoint
        output[0, 3] = [40, 40]
        target[0, 3] = [30, 30]
        # fifth keypoint
        output[0, 4] = [20, 10]
        target[0, 4] = [0, 10]

        gt_instances = InstanceData()
        gt_instances.keypoints = target
        gt_instances.keypoints_visible = np.array(
            [[True, True, False, True, True]])

        pred_instances = InstanceData()
        pred_instances.keypoints = output

        data = {'inputs': None}
        data_sample = {
            'gt_instances': gt_instances.to_dict(),
            'pred_instances': pred_instances.to_dict()
        }

        self.data_batch = [data]
        self.data_samples = [data_sample]

    def test_auc_evaluate(self):
        """test AUC evaluation metric."""
        auc_metric = AUC(norm_factor=20, num_thrs=4)
        auc_metric.process(self.data_batch, self.data_samples)
        auc = auc_metric.evaluate(1)
        target = {'AUC': 0.375}
        self.assertDictEqual(auc, target)

    def test_epe_evaluate(self):
        """test EPE evaluation metric."""
        epe_metric = EPE()
        epe_metric.process(self.data_batch, self.data_samples)
        epe = epe_metric.evaluate(1)
        self.assertAlmostEqual(epe['EPE'], 11.5355339)
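

# ---------------------------------------------------------------------------
# Hand derivation of the expected values above. The visible prediction/GT
# distances are 4, 8, sqrt(200) ~ 14.142 and 20 (keypoint 2 is masked):
#   EPE = (4 + 8 + 14.142 + 20) / 4 ~ 11.5355339
#   AUC: dividing by norm_factor=20 gives [0.2, 0.4, 0.707, 1.0]; the PCK
#   at the 4 thresholds [0, 0.25, 0.5, 0.75] is [0, 0.25, 0.5, 0.75],
#   whose mean is 0.375.
# A runnable sketch (`_naive_auc` is not a mmpose API; the even threshold
# grid over [0, 1) is an assumption that reproduces the expected value):
# ---------------------------------------------------------------------------
def _naive_auc(dists, norm, num_thrs):
    """AUC sketch: mean PCK over `num_thrs` thresholds spaced over [0, 1)."""
    nd = np.asarray(dists) / norm
    return np.mean([(nd < t).mean() for t in np.arange(num_thrs) / num_thrs])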


class TestNME(TestCase):

    def _generate_data(self,
                       batch_size: int = 1,
                       num_keypoints: int = 5,
                       norm_item: str = 'box_size') -> tuple:
        """Generate data_batch and data_samples according to different
        settings."""
        data_batch = []
        data_samples = []

        for i in range(batch_size):
            gt_instances = InstanceData()
            keypoints = np.zeros((1, num_keypoints, 2))
            keypoints[0, i] = [0.5 * i, 0.5 * i]
            gt_instances.keypoints = keypoints
            gt_instances.keypoints_visible = np.ones(
                (1, num_keypoints, 1)).astype(bool)
            gt_instances.keypoints_visible[0, (2 * i) % batch_size, 0] = False
            gt_instances[norm_item] = np.random.random((1, 1)) * 20 * i
            pred_instances = InstanceData()
            pred_instances.keypoints = keypoints

            data = {'inputs': None}
            data_sample = {
                'gt_instances': gt_instances.to_dict(),
                'pred_instances': pred_instances.to_dict(),
            }

            data_batch.append(data)
            data_samples.append(data_sample)
        return data_batch, data_samples

    def test_nme_evaluate(self):
        """test NME evaluation metric."""
        # test when norm_mode = 'use_norm_item'
        # test norm_item = 'box_size' like in `AFLWDataset`
        norm_item = 'box_size'
        nme_metric = NME(norm_mode='use_norm_item', norm_item=norm_item)
        aflw_meta_info = dict(from_file='configs/_base_/datasets/aflw.py')
        aflw_dataset_meta = parse_pose_metainfo(aflw_meta_info)
        nme_metric.dataset_meta = aflw_dataset_meta

        data_batch, data_samples = self._generate_data(
            batch_size=4, num_keypoints=19, norm_item=norm_item)
        nme_metric.process(data_batch, data_samples)
        nme = nme_metric.evaluate(4)
        target = {'NME': 0.0}
        self.assertDictEqual(nme, target)

        # test when norm_mode = 'keypoint_distance'
        # when `keypoint_indices = None`,
        # use default `keypoint_indices` like in `Horse10Dataset`
        nme_metric = NME(norm_mode='keypoint_distance')
        horse10_meta_info = dict(
            from_file='configs/_base_/datasets/horse10.py')
        horse10_dataset_meta = parse_pose_metainfo(horse10_meta_info)
        nme_metric.dataset_meta = horse10_dataset_meta

        data_batch, data_samples = self._generate_data(
            batch_size=4, num_keypoints=22)
        nme_metric.process(data_batch, data_samples)
        nme = nme_metric.evaluate(4)
        target = {'NME': 0.0}
        self.assertDictEqual(nme, target)

        # test when norm_mode = 'keypoint_distance'
        # specify custom `keypoint_indices`
        keypoint_indices = [2, 4]
        nme_metric = NME(
            norm_mode='keypoint_distance', keypoint_indices=keypoint_indices)
        coco_meta_info = dict(from_file='configs/_base_/datasets/coco.py')
        coco_dataset_meta = parse_pose_metainfo(coco_meta_info)
        nme_metric.dataset_meta = coco_dataset_meta

        data_batch, data_samples = self._generate_data(
            batch_size=2, num_keypoints=17)
        nme_metric.process(data_batch, data_samples)
        nme = nme_metric.evaluate(2)
        target = {'NME': 0.0}
        self.assertDictEqual(nme, target)
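
    # NOTE: in all three cases above the predictions equal the ground
    # truth, so the normalized mean error is exactly 0 regardless of the
    # normalization used ('box_size', the dataset's default keypoint
    # pair, or custom `keypoint_indices`).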

    def test_exceptions_and_warnings(self):
        """test exceptions and warnings."""
        # test invalid norm_mode
        with self.assertRaisesRegex(
                KeyError,
                "`norm_mode` should be 'use_norm_item' or 'keypoint_distance'"
        ):
            nme_metric = NME(norm_mode='invalid')

        # test when norm_mode = 'use_norm_item' but norm_item is not given
        with self.assertRaisesRegex(
                KeyError, '`norm_mode` is set to `"use_norm_item"`, '
                'please specify the `norm_item`'):
            nme_metric = NME(norm_mode='use_norm_item', norm_item=None)

        # test when norm_mode = 'use_norm_item'
        # but the `norm_item` is not in data_info
        with self.assertRaisesRegex(
                AssertionError,
                'The ground truth data info do not have the expected '
                'normalized factor'):
            nme_metric = NME(norm_mode='use_norm_item', norm_item='norm_item1')
            coco_meta_info = dict(from_file='configs/_base_/datasets/coco.py')
            coco_dataset_meta = parse_pose_metainfo(coco_meta_info)
            nme_metric.dataset_meta = coco_dataset_meta

            data_batch, data_samples = self._generate_data(
                norm_item='norm_item2')
            # raise AssertionError here
            nme_metric.process(data_batch, data_samples)

        # test when norm_mode = 'keypoint_distance', `keypoint_indices` = None
        # but the dataset_name is not in `DEFAULT_KEYPOINT_INDICES`
        with self.assertRaisesRegex(
                KeyError, 'can not find the keypoint_indices in '
                '`DEFAULT_KEYPOINT_INDICES`'):
            nme_metric = NME(
                norm_mode='keypoint_distance', keypoint_indices=None)
            coco_meta_info = dict(from_file='configs/_base_/datasets/coco.py')
            coco_dataset_meta = parse_pose_metainfo(coco_meta_info)
            nme_metric.dataset_meta = coco_dataset_meta

            data_batch, data_samples = self._generate_data()
            nme_metric.process(data_batch, data_samples)
            # raise KeyError here
            _ = nme_metric.evaluate(1)

        # test when len(keypoint_indices) is not 2
        with self.assertRaisesRegex(
                AssertionError,
                'The keypoint indices used for normalization should be a pair.'
        ):
            nme_metric = NME(
                norm_mode='keypoint_distance', keypoint_indices=[0, 1, 2])
            coco_meta_info = dict(from_file='configs/_base_/datasets/coco.py')
            coco_dataset_meta = parse_pose_metainfo(coco_meta_info)
            nme_metric.dataset_meta = coco_dataset_meta

            data_batch, data_samples = self._generate_data()
            nme_metric.process(data_batch, data_samples)
            # raise AssertionError here
            _ = nme_metric.evaluate(1)

        # test when the dataset does not contain the required keypoints
        with self.assertRaisesRegex(AssertionError,
                                    'dataset does not contain the required'):
            nme_metric = NME(
                norm_mode='keypoint_distance', keypoint_indices=[17, 18])
            coco_meta_info = dict(from_file='configs/_base_/datasets/coco.py')
            coco_dataset_meta = parse_pose_metainfo(coco_meta_info)
            nme_metric.dataset_meta = coco_dataset_meta

            data_batch, data_samples = self._generate_data()
            nme_metric.process(data_batch, data_samples)
            # raise AssertionError here
            _ = nme_metric.evaluate(1)
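

# ---------------------------------------------------------------------------
# For reference, a minimal sketch of the NME computation tested above
# (illustrative only; `_naive_nme` is not part of mmpose). The mean
# visible-keypoint error of each sample is divided by a per-sample norm:
# a stored factor such as `box_size` for `norm_mode='use_norm_item'`, or
# the distance between a dataset-specific keypoint pair for
# `norm_mode='keypoint_distance'`.
# ---------------------------------------------------------------------------
def _naive_nme(pred, gt, mask, norm):
    """NME sketch: pred/gt are (N, K, 2), mask is (N, K) bool, norm is (N,)."""
    dist = np.linalg.norm(pred - gt, axis=-1)  # (N, K) keypoint errors
    per_sample = np.array([d[m].mean() for d, m in zip(dist, mask)])
    return (per_sample / norm).mean()


# Allow running this file directly; upstream typically runs it through
# pytest (e.g. `pytest tests/test_evaluation/test_metrics/
# test_keypoint_2d_metrics.py` -- the exact path is an assumption).
if __name__ == '__main__':
    import unittest
    unittest.main()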