# Source code for playground_metrics.match_detections

"""Implement the public interface to match a set of detections and ground truths."""

from abc import ABC, abstractmethod

import numpy as np
from pygeos import area, is_empty, intersection

from .utils.geometry import GeometryType, intersection_over_union, is_type, euclidean_distance, as_boxes, \
    point_to_box, as_points


class MatchEngineBase(ABC):
    """Match detections with their ground truths according to a similarity matrix and a detection confidence score.

    Matching may be done using coco algorithm or xView algorithm (which yield different matches as described for an
    intersection-over-union similarity matrix in :ref:`match`) or with non-unitary matching.

    Subclasses must implement :meth:`compute_similarity_matrix` and :meth:`trim_similarity_matrix` to be functional.

    Args:
        match_algorithm (str) : Either 'coco', 'xview' or 'non-unitary' to choose the match algorithm

    Attributes:
        match_algorithm (str) : Either 'coco', 'xview' or 'non-unitary' and indicates the match algorithm used

    Raises:
        ValueError: If ``match_algorithm`` is not one of the supported algorithms.

    """

    # Attributes shown by ``__repr__`` and ``__str__`` when they exist on the instance
    _DISPLAYED_ARGUMENTS = ('threshold', 'match_algorithm', 'bounding_box_size')

    def __init__(self, match_algorithm):
        if match_algorithm not in ('coco', 'xview', 'non-unitary'):
            raise ValueError("match_algorithm must be either coco, xview or non-unitary")

        self.match_algorithm = match_algorithm

        # Authorized geometric types for this match engine
        self._detection_types = (GeometryType.POLYGON, GeometryType.POINT)
        self._ground_truth_types = (GeometryType.POLYGON, GeometryType.POINT)

    def _format_arguments(self):
        """Return the ``name=value`` list of the displayed arguments which are set on this instance."""
        return ', '.join('{}={}'.format(name, getattr(self, name))
                         for name in self._DISPLAYED_ARGUMENTS
                         if hasattr(self, name))

    def __repr__(self):
        """Represent the :class:`~playground_metrics.match_detections.MatchEngineBase` as a string."""
        return '{}({})'.format(self.__class__.__name__, self._format_arguments())

    def __str__(self):
        """Represent the :class:`~playground_metrics.match_detections.MatchEngineBase` as a string.

        Same as :meth:`__repr__` except that ``MatchEngine`` is stripped from the class name.

        """
        return '{}({})'.format(self.__class__.__name__.replace('MatchEngine', ''), self._format_arguments())

    def _compute_similarity_matrix_and_trim(self, detections, ground_truths, label_mean_area=None):
        """Return the similarity matrix together with the candidate matches kept by the trimming step."""
        similarity_matrix = self.compute_similarity_matrix(detections, ground_truths, label_mean_area)
        similarity_matches = self.trim_similarity_matrix(similarity_matrix, detections, ground_truths,
                                                         label_mean_area)
        return similarity_matrix, similarity_matches

    @abstractmethod
    def compute_similarity_matrix(self, detections, ground_truths, label_mean_area=None):
        r"""Compute a similarity matrix between detections and ground truths.

        Abstract method.

        This method must be overridden in subsequent subclasses to handle both bounding box and polygon input format.

        Args:
            detections (ndarray, list) : A ndarray of detections stored as:

                * Bounding boxes for a given class where each row is a detection stored as:
                  ``[BoundingBox, confidence]``
                * Polygons for a given class where each row is a detection stored as:
                  ``[Polygon, confidence]``
                * Points for a given class where each row is a detection stored as:
                  ``[Point, confidence]``

            ground_truths (ndarray,list) : A ndarray of ground truth stored as:

                * Bounding boxes for a given class where each row is a ground truth stored as:
                  ``[BoundingBox]``
                * Polygons for a given class where each row is a ground truth stored as:
                  ``[Polygon]``
                * Points for a given class where each row is a ground truth stored as:
                  ``[Point]``

            label_mean_area (float) : Optional, default to ``None``. The mean area for each label in the dataset.

        Returns:
            ndarray : A similarity matrix of dimension (#detections, #ground truth)

        """
        raise NotImplementedError

    @abstractmethod
    def trim_similarity_matrix(self, similarity_matrix, detections, ground_truths, label_mean_area=None):
        r"""Compute the positions of the similarity matrix which pass a first rough trimming.

        Typically for IoU this would be the result of a simple thresholding but it might be any method fit to do a
        rough filtering of possible ground truth candidates to match with a given detection.

        Abstract method.

        Args:
            similarity_matrix: The similarity matrix between detections and ground truths : dimension (#detection, #gt)
            detections (ndarray, list) : A ndarray of detections stored as:

                * Bounding boxes for a given class where each row is a detection stored as:
                  ``[BoundingBox, confidence]``
                * Polygons for a given class where each row is a detection stored as:
                  ``[Polygon, confidence]``
                * Points for a given class where each row is a detection stored as:
                  ``[Point, confidence]``

            ground_truths (ndarray,list) : A ndarray of ground truth stored as:

                * Bounding boxes for a given class where each row is a ground truth stored as:
                  ``[BoundingBox]``
                * Polygons for a given class where each row is a ground truth stored as:
                  ``[Polygon]``
                * Points for a given class where each row is a ground truth stored as:
                  ``[Point]``

            label_mean_area (float) : Optional, default to ``None``. The mean area for each label in the dataset.

        Returns:
            ndarray: An array of dimension (2, N) where each column is a tuple (detection, ground truth) describing
            a potential match. To be more precise, each match-tuple in the array corresponds to a position in the
            similarity matrix which will be used by the match algorithm to compute the final match. The match
            algorithms split this array on changes of the detection index, so columns must be ordered by detection
            index.

        """
        raise NotImplementedError

    def match(self, detections, ground_truths, label_mean_area=None):
        r"""Match detections with ground truths using the configured similarity, trimming and match algorithm.

        Detections and ground truths are
        :class:`~playground_metrics.utils.geometry_utils.geometry.Geometry` objects. The match is computed with
        either Coco algorithm, xView algorithm or a naive *non-unitary* match.

        Args:
            detections (ndarray, list) : A ndarray of detections stored as:

                * Bounding boxes for a given class where each row is a detection stored as:
                  ``[BoundingBox, confidence]``
                * Polygons for a given class where each row is a detection stored as:
                  ``[Polygon, confidence]``
                * Points for a given class where each row is a detection stored as:
                  ``[Point, confidence]``

            ground_truths (ndarray,list) : A ndarray of ground truth stored as:

                * Bounding boxes for a given class where each row is a ground truth stored as:
                  ``[BoundingBox]``
                * Polygons for a given class where each row is a ground truth stored as:
                  ``[Polygon]``
                * Points for a given class where each row is a ground truth stored as:
                  ``[Point]``

            label_mean_area (float) : Optional, default to ``None``. The mean area for each label in the dataset.

        Returns:
            ndarray : A binary matrix of all matches of dimension (#detections, #ground truth). Detections are sorted
            by decreasing confidence before the similarity matrix is computed, so rows follow that order.

        Raises:
            TypeError: If a detection or a ground truth has a geometric type which this engine does not accept.
            ValueError: If ``match_algorithm`` was changed to an unsupported value after construction.

        """
        # Nothing to match: return an empty matrix with the expected shape
        if detections.shape[0] == 0:
            return np.zeros((0, ground_truths.shape[0]))

        if ground_truths.shape[0] == 0:
            return np.zeros((detections.shape[0], 0))

        # Geometric static typing
        self._check_geometry_types(detections[:, 0], self._detection_types, 'detections')
        self._check_geometry_types(ground_truths[:, 0], self._ground_truth_types, 'ground truths')

        # We sort detections by confidence before computing the similarity matrix
        detections = self._sort_detection_by_confidence(detections)

        # Compute the similarity matrix and the array of positions in it which pass the first trimming
        # (typically for IoU this would be the result of a simple thresholding).
        similarity_matrix, similarity_matches = self._compute_similarity_matrix_and_trim(detections,
                                                                                         ground_truths,
                                                                                         label_mean_area)

        # We match the detection and the ground truth using the configured algorithm
        if self.match_algorithm == 'coco':
            return self._coco_match(similarity_matrix, similarity_matches)
        if self.match_algorithm == 'non-unitary':
            return self._non_unitary_match(similarity_matrix, similarity_matches)
        if self.match_algorithm == 'xview':
            return self._xview_match(similarity_matrix, similarity_matches)
        raise ValueError('Invalid match algorithm: must be either coco, xview or non-unitary')

    @staticmethod
    def _check_geometry_types(geometries, allowed_types, role):
        """Raise a :exc:`TypeError` naming ``role`` if any geometry is not of one of ``allowed_types``."""
        if not np.all(is_type(geometries, *allowed_types)):
            raise TypeError('Invalid geometric type provided in '
                            '{}, expected to be one of {}'
                            ''.format(role, ' '.join(['{}'.format(geom_type.name)
                                                      for geom_type in allowed_types])))

    @staticmethod
    def _sort_detection_by_confidence(detections):
        """Return the detection rows reordered by decreasing confidence (second column)."""
        # Ascending argsort read backwards gives the decreasing order
        sort_indices = np.argsort(detections[:, 1])[::-1]
        return detections[sort_indices, :]

    @staticmethod
    def _group_matches(similarity_matches, key_row):
        """Group the candidate matches by the index found in row ``key_row``.

        Args:
            similarity_matches (ndarray): Candidate matches of dimension (2, N), N > 0, whose columns are ordered
                along ``key_row``.
            key_row (int): ``0`` to group by detection, ``1`` to group by ground truth.

        Returns:
            dict: Maps each index present in ``key_row`` to the array of indices it is paired with in the other row.

        """
        # A new group starts wherever the key index changes between two consecutive columns
        boundaries = np.where(np.diff(similarity_matches[key_row, :]) != 0)[0] + 1
        return {group[key_row, 0]: group[1 - key_row, :]
                for group in np.hsplit(similarity_matches, boundaries)}

    @staticmethod
    def _coco_match(similarity_matrix, similarity_matches):
        r"""Match detections with ground truths using Coco algorithm.

        Detections are visited in row order. Each one takes, among its candidates which were not taken by a previous
        detection, the ground truth with the highest similarity.

        Args:
            similarity_matrix: The similarity matrix between detections and ground truths : dimension (#detection, #gt)
            similarity_matches: The (2, N) array of candidate (detection, ground truth) positions, ordered by
                detection index

        Returns:
            ndarray: A binary matrix of all matches of dimension (#detections, #ground truth)

        """
        # We prepare the detection match matrix
        match_matrix = np.zeros_like(similarity_matrix)

        if similarity_matches.shape[1] == 0:  # No matches at all
            return match_matrix

        # detection -> candidate ground truths
        forward = MatchEngineBase._group_matches(similarity_matches, 0)
        # ground truth -> candidate detections (grouping needs the columns ordered by ground truth)
        similarity_matches_by_gt = similarity_matches[:, np.argsort(similarity_matches[1, :])]
        backward = MatchEngineBase._group_matches(similarity_matches_by_gt, 1)

        for k in range(similarity_matrix.shape[0]):
            # For each detection we select its remaining ground truth candidates
            detection_matches = forward.get(k, np.zeros((0, 0)))

            # If we don't have anything left to match -> skip
            if detection_matches.size == 0:
                continue

            # We select the candidate with the biggest similarity
            n = detection_matches[np.argmax(similarity_matrix[k, detection_matches])]

            # We delete the ground truth column index from future match testing
            for d in backward[n]:
                forward[d] = forward[d][forward[d] != n]

            # We set the match flag to 1
            match_matrix[k, n] = 1

        return match_matrix

    @staticmethod
    def _xview_match(similarity_matrix, similarity_matches):
        r"""Match detections with ground truths using xView algorithm.

        Detections are visited in row order. Each one selects its candidate with the highest similarity and is
        matched only if that ground truth was not matched by a previous detection; it never falls back on another
        candidate.

        Args:
            similarity_matrix: The similarity matrix between detections and ground truths : dimension (#detection, #gt)
            similarity_matches: The (2, N) array of candidate (detection, ground truth) positions, ordered by
                detection index

        Returns:
            ndarray: A binary matrix of all matches of dimension (#detections, #ground truth)

        """
        # We prepare the detection match matrix
        match_matrix = np.zeros_like(similarity_matrix)

        if similarity_matches.shape[1] == 0:  # No matches at all
            return match_matrix

        ground_truth_matched = np.zeros(similarity_matrix.shape[1], dtype=bool)

        # detection -> candidate ground truths
        forward = MatchEngineBase._group_matches(similarity_matches, 0)

        for k in range(similarity_matrix.shape[0]):
            # For each detection we select its ground truth candidates
            detection_matches = forward.get(k, np.zeros((0, 0)))

            # If we don't have anything to match -> skip
            if detection_matches.size == 0:
                continue

            # We select the candidate with the biggest similarity
            n = detection_matches[np.argmax(similarity_matrix[k, detection_matches])]

            if not ground_truth_matched[n]:
                # We match the detection and the ground truth
                ground_truth_matched[n] = True
                match_matrix[k, n] = 1

        return match_matrix

    @staticmethod
    def _non_unitary_match(similarity_matrix, similarity_matches):
        r"""Match every (detection, ground truth) pair yielded by the trim method.

        Args:
            similarity_matrix: The similarity matrix between detections and ground truths : dimension (#detection, #gt)
            similarity_matches: The (2, N) array of candidate (detection, ground truth) positions

        Returns:
            ndarray: A binary matrix of all matches of dimension (#detections, #ground truth)

        """
        # We prepare the detection match matrix and flag every candidate position
        match_matrix = np.zeros_like(similarity_matrix)
        match_matrix[similarity_matches[0, :], similarity_matches[1, :]] = 1

        return match_matrix


class MatchEngineIoU(MatchEngineBase):
    """Match detections with their ground truths according to their IoU and the detection confidence score.

    Args:
        threshold (float): The IoU threshold at which one considers a potential match as valid
        match_algorithm (str) : Either 'coco', 'xview' or 'non-unitary' to choose the match algorithm

    """

    def __init__(self, threshold, match_algorithm):
        super(MatchEngineIoU, self).__init__(match_algorithm)

        # IoU is only computed between polygons
        self._detection_types = (GeometryType.POLYGON, )
        self._ground_truth_types = (GeometryType.POLYGON, )

        self.threshold = threshold

    def compute_similarity_matrix(self, detections, ground_truths, label_mean_area=None):
        r"""Compute the iou scores between all pairs of geometries with an Rtree on detections to speed up computation.

        Args:
            detections (ndarray, list) : A ndarray of detections stored as:

                * Bounding boxes for a given class where each row is a detection stored as:
                  ``[BoundingBox, confidence]``
                * Polygons for a given class where each row is a detection stored as:
                  ``[Polygon, confidence]``

            ground_truths (ndarray,list) : A ndarray of ground truth stored as:

                * Bounding boxes for a given class where each row is a ground truth stored as:
                  ``[BoundingBox]``
                * Polygons for a given class where each row is a ground truth stored as:
                  ``[Polygon]``

            label_mean_area (float) : Optional, default to ``None``. The mean area for each label in the dataset,
                if given, it is used to match with *iIoU* instead of *IoU* (c.f. :ref:`iiou`)

        Returns:
            ndarray : An IoU matrix (#detections, #ground truth) whose rows follow the detections sorted by
            decreasing confidence

        """
        # NOTE(review): ``match`` already hands over sorted detections; sorting again here may reorder detections
        # with equal confidence relative to the caller's array -- confirm that tie order does not matter.
        detections = self._sort_detection_by_confidence(detections)
        iou = intersection_over_union(detections[:, 0], ground_truths[:, 0])
        if label_mean_area is not None:
            # iIoU: every ground truth column is rescaled by (mean label area / ground truth area)
            iou = (label_mean_area / area(ground_truths[:, 0])) * iou

        return iou

    def trim_similarity_matrix(self, similarity_matrix, detections, ground_truths, label_mean_area=None):
        r"""Compute an array containing the indices in columns of similarity passing the first trimming.

        Here this is the result of a simple thresholding over IoU: a position is kept when its similarity is greater
        than or equal to the threshold.

        Args:
            similarity_matrix: The similarity matrix between detections and ground truths : dimension (#detection, #gt)
            detections (ndarray, list) : A ndarray of detections stored as:

                * Bounding boxes for a given class where each row is a detection stored as:
                  ``[BoundingBox, confidence]``
                * Polygons for a given class where each row is a detection stored as:
                  ``[Polygon, confidence]``

            ground_truths (ndarray,list) : A ndarray of ground truth stored as:

                * Bounding boxes for a given class where each row is a ground truth stored as:
                  ``[BoundingBox]``
                * Polygons for a given class where each row is a ground truth stored as:
                  ``[Polygon]``

            label_mean_area (float) : Optional, default to ``None``. The mean area for each label in the dataset,
                if given, it is used to match with *iIoU* instead of *IoU* (c.f. :ref:`iiou`)

        Returns:
            ndarray: An array of dimension (2, N) where each column is a tuple (detection, ground truth) describing
            a potential match. To be more precise, each match-tuple in the array corresponds to a position in the
            similarity matrix which will be used by the match algorithm to compute the final match.

        """
        # The mask positions are computed once and reused for both the stacking and the ordering
        detection_indices, ground_truth_indices = np.nonzero(similarity_matrix >= self.threshold)
        order = np.argsort(detection_indices)
        return np.stack((detection_indices, ground_truth_indices))[:, order]


class MatchEngineEuclideanDistance(MatchEngineBase):
    """Match detections with their ground truths according to their relative distance and the confidence score.

    Args:
        threshold (float): The distance threshold at which one considers a potential match as valid
        match_algorithm (str) : Either 'coco', 'xview' or 'non-unitary' to choose the match algorithm

    """

    def __init__(self, threshold, match_algorithm):
        super(MatchEngineEuclideanDistance, self).__init__(match_algorithm)
        # The threshold is stored in similarity space (similarity = 1 - distance)
        self._threshold = 1 - threshold

    @property
    def threshold(self):
        """float: The distance threshold at which one considers a potential match as valid."""
        return 1 - self._threshold

    def compute_similarity_matrix(self, detections, ground_truths, label_mean_area=None):
        r"""Compute a partial similarity matrix based on the euclidean distance between all pairs of points.

        The difference with :class:`~playground_metrics.match_detections.MatchEnginePointInBox` lies in the
        similarity matrix rough trimming which depends on a threshold rather than on whether a detection (as a point)
        lies within a ground truth polygon (or bounding box).

        The computed matrix is :math:`\mathcal{S} = 1 - \mathcal{D}` with:

        .. math::

            \mathcal{D}_{ij} = \begin{cases} \left\lVert d_i - gt_j \right\rVert_2 &\mbox{if } d_i \in B(gt_j, t)\\
                \inf &\mbox{if }  d_i \notin B(gt_j, t) \end{cases}

        Where :math:`B(gt_j, t)` is a square box centered in :math:`gt_j` built with a width and a height of
        :math:`2t`.

        Args:
            detections (ndarray, list) : A ndarray of detections stored as:

                * Bounding boxes for a given class where each row is a detection stored as:
                  ``[BoundingBox, confidence]``
                * Polygons for a given class where each row is a detection stored as:
                  ``[Polygon, confidence]``
                * Points for a given class where each row is a detection stored as:
                  ``[Point, confidence]``

            ground_truths (ndarray,list) : A ndarray of ground truth stored as:

                * Bounding boxes for a given class where each row is a ground truth stored as:
                  ``[BoundingBox]``
                * Polygons for a given class where each row is a ground truth stored as:
                  ``[Polygon]``
                * Points for a given class where each row is a ground truth stored as:
                  ``[Point]``

            label_mean_area (float) : Optional, default to ``None``. The mean area for each label in the dataset.

        Returns:
            ndarray : A similarity matrix (#detections, #ground truth) whose rows follow the detections sorted by
            decreasing confidence

        """
        # NOTE(review): ``match`` already hands over sorted detections; sorting again here may reorder detections
        # with equal confidence relative to the caller's array -- confirm that tie order does not matter.
        detections = self._sort_detection_by_confidence(detections)
        box_side = 2 * self.threshold
        search_boxes = point_to_box(ground_truths[:, 0], width=box_side, height=box_side)
        return euclidean_distance(as_points(detections[:, 0]), search_boxes)

    def trim_similarity_matrix(self, similarity_matrix, detections, ground_truths, label_mean_area=None):
        r"""Compute an array containing the indices in columns of similarity passing the first trimming.

        Here this is the result of a simple thresholding over the similarity matrix: a position is kept when its
        similarity is greater than or equal to ``1 - threshold``.

        Args:
            similarity_matrix: The similarity matrix between detections and ground truths : dimension (#detection, #gt)
            detections (ndarray, list) : A ndarray of detections stored as:

                * Bounding boxes for a given class where each row is a detection stored as:
                  ``[BoundingBox, confidence]``
                * Polygons for a given class where each row is a detection stored as:
                  ``[Polygon, confidence]``
                * Points for a given class where each row is a detection stored as:
                  ``[Point, confidence]``

            ground_truths (ndarray,list) : A ndarray of ground truth stored as:

                * Bounding boxes for a given class where each row is a ground truth stored as:
                  ``[BoundingBox]``
                * Polygons for a given class where each row is a ground truth stored as:
                  ``[Polygon]``
                * Points for a given class where each row is a ground truth stored as:
                  ``[Point]``

            label_mean_area (float) : Optional, default to ``None``. The mean area for each label in the dataset.

        Returns:
            ndarray: An array of dimension (2, N) where each column is a tuple (detection, ground truth) describing
            a potential match. To be more precise, each match-tuple in the array corresponds to a position in the
            similarity matrix which will be used by the match algorithm to compute the final match.

        """
        # The mask positions are computed once and reused for both the stacking and the ordering
        detection_indices, ground_truth_indices = np.nonzero(similarity_matrix >= self._threshold)
        order = np.argsort(detection_indices)
        return np.stack((detection_indices, ground_truth_indices))[:, order]


class MatchEnginePointInBox(MatchEngineBase):
    """Match detections with their ground truths according to their relative distance and point-in-box membership.

    A detection may only match a ground truth if the detection point is in the ground truth box; the detection
    confidence score drives the order in which detections are matched.

    Args:
        match_algorithm (str) : Either 'coco', 'xview' or 'non-unitary' to choose the match algorithm

    """

    def __init__(self, match_algorithm):
        super(MatchEnginePointInBox, self).__init__(match_algorithm)

        # Ground truths must be polygons; detection types are inherited from the base class
        self._ground_truth_types = (GeometryType.POLYGON, )

    def compute_similarity_matrix(self, detections, ground_truths, label_mean_area=None):
        r"""Compute a partial similarity matrix based on the euclidean distance between all pairs of points.

        An Rtree on detections is used to speed up computation.

        The difference with :class:`~playground_metrics.match_detections.MatchEngineEuclideanDistance` lies in the
        similarity matrix rough trimming which depends on whether a detection (as a point) lies within a ground truth
        polygon (or bounding box) rather than on a threshold.

        The computed matrix is :math:`\mathcal{S} = 1 - \mathcal{D}` with:

        .. math::

            \mathcal{D}_{ij} = \left\lVert d_i - gt_j \right\rVert_2

        Args:
            detections (ndarray, list) : A ndarray of detections stored as:

                * Bounding boxes for a given class where each row is a detection stored as:
                  ``[BoundingBox, confidence]``
                * Polygons for a given class where each row is a detection stored as:
                  ``[Polygon, confidence]``
                * Points for a given class where each row is a detection stored as:
                  ``[Point, confidence]``

            ground_truths (ndarray,list) : A ndarray of ground truth stored as:

                * Bounding boxes for a given class where each row is a ground truth stored as:
                  ``[BoundingBox]``
                * Polygons for a given class where each row is a ground truth stored as:
                  ``[Polygon]``

            label_mean_area (float) : Optional, default to ``None``. The mean area for each label in the dataset.

        Returns:
            ndarray : A similarity matrix (#detections, #ground truth) whose rows follow the detections sorted by
            decreasing confidence

        """
        # NOTE(review): ``match`` already hands over sorted detections; sorting again here may reorder detections
        # with equal confidence, while ``trim_similarity_matrix`` indexes the array held by ``match`` -- confirm
        # that tie order does not matter.
        detections = self._sort_detection_by_confidence(detections)
        return euclidean_distance(as_points(detections[:, 0]), as_boxes(ground_truths[:, 0]))

    def trim_similarity_matrix(self, similarity_matrix, detections, ground_truths, label_mean_area=None):
        r"""Compute an array containing the indices in columns of similarity passing the first trimming.

        Here a detection/ground truth pair is kept if the detection
        :class:`~playground_metrics.utils.geometry_utils.geometry.Point` is within the ground truth
        :class:`~playground_metrics.utils.geometry_utils.geometry.BoundingBox` or
        :class:`~playground_metrics.utils.geometry_utils.geometry.Polygon`, that is if their intersection is not
        empty.

        Args:
            similarity_matrix: The similarity matrix between detections and ground truths : dimension (#detection, #gt)
            detections (ndarray, list) : A ndarray of detections stored as:

                * Bounding boxes for a given class where each row is a detection stored as:
                  ``[BoundingBox, confidence]``
                * Polygons for a given class where each row is a detection stored as:
                  ``[Polygon, confidence]``
                * Points for a given class where each row is a detection stored as:
                  ``[Point, confidence]``

            ground_truths (ndarray,list) : A ndarray of ground truth stored as:

                * Bounding boxes for a given class where each row is a ground truth stored as:
                  ``[BoundingBox]``
                * Polygons for a given class where each row is a ground truth stored as:
                  ``[Polygon]``

            label_mean_area (float) : Optional, default to ``None``. The mean area for each label in the dataset.

        Returns:
            ndarray: An array of dimension (2, N) where each column is a tuple (detection, ground truth) describing
            a potential match. To be more precise, each match-tuple in the array corresponds to a position in the
            similarity matrix which will be used by the match algorithm to compute the final match.

        """
        # Candidate positions are those with a finite similarity. ``np.inf`` is used because the ``np.Inf`` alias
        # no longer exists in NumPy 2.
        detection_indices, ground_truth_indices = np.nonzero(similarity_matrix != -np.inf)
        order = np.argsort(detection_indices)
        detection_indices = detection_indices[order]
        ground_truth_indices = ground_truth_indices[order]

        # A candidate is kept only if the detection actually intersects the ground truth geometry; the pygeos
        # functions are applied to all candidate pairs at once.
        intersects = ~is_empty(intersection(detections[detection_indices, 0],
                                            ground_truths[ground_truth_indices, 0]))

        return np.stack((detection_indices, ground_truth_indices))[:, intersects]


class MatchEngineConstantBox(MatchEngineIoU):
    """Match detections with their ground truths according to the IoU of fixed-size bounding boxes.

    The IoU is computed on fixed-size bounding boxes around detection and ground truth points; the detection
    confidence score drives the order in which detections are matched.

    Args:
        threshold (float): The IoU threshold at which one considers a potential match as valid
        match_algorithm (str) : Either 'coco', 'xview' or 'non-unitary' to choose the match algorithm
        bounding_box_size (float): The fixed-size bounding box size

    """

    def __init__(self, threshold, match_algorithm, bounding_box_size):
        super(MatchEngineConstantBox, self).__init__(threshold, match_algorithm)
        self.bounding_box_size = bounding_box_size

        # Override authorized geometric types for this match engine
        self._detection_types = (GeometryType.POLYGON, GeometryType.POINT)
        self._ground_truth_types = (GeometryType.POLYGON, GeometryType.POINT)

    def compute_similarity_matrix(self, detections, ground_truths, label_mean_area=None):
        r"""Compute a partial similarity matrix based on the IoU between constant-sized bounding boxes.

        Every detection and ground truth is replaced by a box of size ``bounding_box_size`` before delegating to
        :meth:`MatchEngineIoU.compute_similarity_matrix`, which uses an Rtree on detections to speed up computation.

        Args:
            detections (ndarray, list) : A ndarray of detections stored as:

                * Bounding boxes for a given class where each row is a detection stored as:
                  ``[BoundingBox, confidence]``
                * Polygons for a given class where each row is a detection stored as:
                  ``[Polygon, confidence]``
                * Points for a given class where each row is a detection stored as:
                  ``[Point, confidence]``

            ground_truths (ndarray,list) : A ndarray of ground truth stored as:

                * Bounding boxes for a given class where each row is a ground truth stored as:
                  ``[BoundingBox]``
                * Polygons for a given class where each row is a ground truth stored as:
                  ``[Polygon]``
                * Points for a given class where each row is a ground truth stored as:
                  ``[Point]``

            label_mean_area (float) : Optional, default to ``None``. The mean area for each label in the dataset.

        Returns:
            ndarray : An IoU matrix (#detections, #ground truth)

        """
        size = self.bounding_box_size

        # Rebuild the ``[geometry, confidence]`` rows with the fixed-size boxes in place of the geometries
        detection_boxes = point_to_box(detections[:, 0], width=size, height=size)
        detections = np.stack((detection_boxes, detections[:, 1]), axis=1)

        # Ground truths are turned back into a one-column array, as expected by the parent implementation
        ground_truths = point_to_box(ground_truths[:, 0], width=size, height=size)[:, None]

        return super(MatchEngineConstantBox, self).compute_similarity_matrix(detections,
                                                                             ground_truths,
                                                                             label_mean_area)