mean_average_precision

COCO mean average precision (mAP) implementation.

`MeanAveragePrecision` ¶

Bases: Trace

Calculate COCO mean average precision.

Parameters:

Name	Type	Description	Default
`num_classes`	`int`	Maximum `int` value for your class label. In the COCO dataset only 80 classes are used, but the maximum value of the class label is `90`. In this case `num_classes` should be `90`.	required

Returns:

Type	Description
	Mean Average Precision.

Source code in fastestimator\fastestimator\trace\metric\mean_average_precision.py

class MeanAveragePrecision(Trace):
    """Calculate COCO mean average precision.

    For every batch the ground truth and predicted boxes are matched per (image, category) pair. At the end of the
    epoch the matches are accumulated into precision-recall curves, and three values are written to the output keys:
    the precision averaged over all IoU thresholds (mAP), and the average precision at IoU 0.5 and 0.75.

    Args:
        num_classes: Maximum `int` value for your class label. In the COCO dataset only 80 classes are used, but the
            maximum value of the class label is `90`. In this case `num_classes` should be `90`.
        true_key: Name of the input holding the ground truth bounding boxes.
        pred_key: Name of the input holding the predicted bounding boxes.
        mode: Mode forwarded to the parent `Trace`.
        output_name: Three names under which mAP, AP50 and AP75 are stored, in that order.

    Returns:
        Mean Average Precision.
    """
    def __init__(self,
                 num_classes: int,
                 true_key: str = 'bbox',
                 pred_key: str = 'pred',
                 mode: str = "eval",
                 output_name=("mAP", "AP50", "AP75")) -> None:
        super().__init__(inputs=(true_key, pred_key), outputs=output_name, mode=mode)

        assert len(self.outputs) == 3, 'MeanAvgPrecision trace adds 3 fields mAP AP50 AP75 to state dict'

        # The `np.int` alias no longer exists in recent NumPy releases, so the sample counts use the builtin `int`.
        self.iou_thres = np.linspace(.5, 0.95, int(np.round((0.95 - .5) / .05)) + 1, endpoint=True)
        self.recall_thres = np.linspace(.0, 1.00, int(np.round((1.00 - .0) / .01)) + 1, endpoint=True)
        self.categories = range(1, num_classes + 1)  # MSCOCO style class label starts from 1
        self.max_detection = 100
        self.image_ids = []

        # eval
        self.evalimgs = {}
        self.eval = {}
        self.ids_in_epoch = 0  # reset per epoch

        # reset per batch
        self.gt = defaultdict(list)  # gt for evaluation
        self.det = defaultdict(list)
        self.batch_image_ids = []  # img_ids per batch
        self.ious = defaultdict(list)
        self.ids_unique = []
        self.ids_batch_to_epoch = {}
        self.counter = 0  # unused by this class; kept so the attribute does not disappear for existing users

    @property
    def true_key(self) -> str:
        """Name of the input that holds the ground truth boxes."""
        return self.inputs[0]

    @property
    def pred_key(self) -> str:
        """Name of the input that holds the predicted boxes."""
        return self.inputs[1]

    def _get_id_in_epoch(self, idx_in_batch: int) -> int:
        """Get unique image id in epoch.

        Id starts from 1. The first time a batch-local index is seen within a batch it is given the next free epoch
        id; later calls with the same index return that same id.

        Args:
            idx_in_batch: Image id within a batch.

        Returns:
            Global unique id within one epoch.
        """
        if idx_in_batch not in self.ids_batch_to_epoch:
            self.ids_unique.append(idx_in_batch)
            self.ids_in_epoch += 1
            self.ids_batch_to_epoch[idx_in_batch] = self.ids_in_epoch
        # Return the id mapped to *this* image rather than the most recently created one.
        return self.ids_batch_to_epoch[idx_in_batch]

    def on_epoch_begin(self, data: Data):
        """Reset instance variables."""
        self.image_ids = []  # append all the image ids coming from each iteration
        self.evalimgs = {}
        self.eval = {}
        self.ids_in_epoch = 0

    def on_batch_begin(self, data: Data):
        """Reset instance variables."""
        self.gt = defaultdict(list)  # gt for evaluation
        self.det = defaultdict(list)  # det for evaluation
        self.batch_image_ids = []  # img_ids per batch

        self.ious = defaultdict(list)
        self.ids_unique = []
        self.ids_batch_to_epoch = {}

    @staticmethod
    def _reshape_gt(gt_array: np.ndarray) -> np.ndarray:
        """Reshape ground truth and add local image id within batch.

        The input ground truth array has shape (batch_size, num_bbox, 5). The 5 is [x1, y1, w, h, label] for each
        bounding box.
        The batch dimension is flattened and only rows whose label is greater than zero are kept, which drops padded
        (all zero) bounding boxes. Each remaining row is [id_in_batch, x1, y1, w, h, label].

        Args:
            gt_array: Ground truth with shape (batch_size, num_bbox, 5).

        Returns:
            Ground truth with shape (num_kept_bbox, 6).
        """
        local_ids = np.repeat(range(gt_array.shape[0]), gt_array.shape[1], axis=None)
        local_ids = np.expand_dims(local_ids, axis=-1)

        gt_with_id = np.concatenate([local_ids, gt_array.reshape(-1, 5)], axis=1)
        keep = gt_with_id[..., -1] > 0

        return gt_with_id[keep]

    @staticmethod
    def _reshape_pred(pred: List[np.ndarray]) -> np.ndarray:
        """Reshape predicted bounding boxes and add local image id within batch.

        The input prediction array is a list of batch_size elements. For each element inside the list, it
        has shape (num_bbox, 6). The 6 is [x1, y1, w, h, label, score] for each bounding box.
        For output we flatten the batch dimension. The output shape is (total_num_bbox_in_batch, 7). The 7 is
        [id_in_batch, x1, y1, w, h, label, score].

        Args:
            pred: List of predicted bounding boxes for each image. Each element in the list has shape (num_bbox, 6).

        Returns:
            Predicted bounding boxes with shape (total_num_bbox_in_batch, 7).
        """
        if len(pred) == 0:
            # np.concatenate rejects an empty sequence; an empty batch simply has no boxes.
            return np.zeros((0, 7))

        pred_with_id = []
        for index, item in enumerate(pred):
            local_ids = np.full((item.shape[0], 1), index)
            pred_with_id.append(np.concatenate([local_ids, item], axis=1))

        return np.concatenate(pred_with_id, axis=0)

    def on_batch_end(self, data: Data):
        """Collect the boxes of this batch and match detections to ground truth per (image, category).

        Args:
            data: Batch data; the entries under `pred_key` and `true_key` are read.
        """
        # begin of reading det and gt
        pred = list(map(to_number, data[self.pred_key]))  # pred is list (batch, ) of np.ndarray (?, 6)
        pred = self._reshape_pred(pred)

        gt = to_number(data[self.true_key])  # gt is np.array (batch, box, 5), box dimension is padded
        gt = self._reshape_gt(gt)

        for idx_in_batch, x1, y1, w, h, label in gt:
            label = int(label)
            id_epoch = self._get_id_in_epoch(idx_in_batch)
            self.batch_image_ids.append(id_epoch)
            self.image_ids.append(id_epoch)
            self.gt[id_epoch, label].append({'idx': id_epoch, 'x1': x1, 'y1': y1, 'w': w, 'h': h, 'label': label})

        for idx_in_batch, x1, y1, w, h, label, score in pred:
            label = int(label)
            # An image can have predictions without any ground truth box. Register it here as well, otherwise the id
            # lookup fails and its detections would never be evaluated.
            id_epoch = self._get_id_in_epoch(idx_in_batch)
            self.batch_image_ids.append(id_epoch)
            self.image_ids.append(id_epoch)
            self.det[id_epoch, label].append({
                'idx': id_epoch, 'x1': x1, 'y1': y1, 'w': w, 'h': h, 'label': label, 'score': score
            })
        # end of reading det and gt

        # batch_image_ids holds one entry per box; evaluate every image only once
        batch_ids = list(dict.fromkeys(self.batch_image_ids))

        # compute iou matrix, matrix index is (img_id, cat_id), each element in matrix has shape (num_det, num_gt)
        self.ious = {(img_id, cat_id): self.compute_iou(self.det[img_id, cat_id], self.gt[img_id, cat_id])
                     for img_id in batch_ids for cat_id in self.categories}

        for cat_id in self.categories:
            for img_id in batch_ids:
                self.evalimgs[(cat_id, img_id)] = self.evaluate_img(cat_id, img_id)

    def on_epoch_end(self, data: Data):
        """Accumulate the per-image matches of the epoch and write mAP, AP50 and AP75 to the output keys.

        Args:
            data: Object the three results are written to.
        """
        self.accumulate()

        mean_ap = self.summarize()
        ap50 = self.summarize(iou=0.5)
        ap75 = self.summarize(iou=0.75)

        data[self.outputs[0]] = mean_ap
        data[self.outputs[1]] = ap50
        data[self.outputs[2]] = ap75

    def evaluate_img(self, cat_id: int, img_id: int) -> Dict:
        """Find gt matches for det given one image and one category.

        Detections are visited from the highest to the lowest score. For each IoU threshold a detection is matched to
        the still unmatched ground truth box with the highest IoU that reaches the threshold.

        Args:
            cat_id: Category id.
            img_id: Image id within the epoch.

        Returns:
            `None` if the image has neither detections nor ground truth for this category. Otherwise a dictionary
            with the keys 'image_id', 'category_id', 'gtIds', 'dtMatches', 'gtMatches', 'dtScores' and 'num_gt'.
        """
        det = self.det[img_id, cat_id]
        gt = self.gt[img_id, cat_id]

        num_det = len(det)
        num_gt = len(gt)

        if num_gt == 0 and num_det == 0:
            return None

        # sort by descending score so the row order agrees with the iou matrix built in compute_iou
        det_index = np.argsort([-d['score'] for d in det], kind='mergesort')

        # cap to max_detection
        det = [det[i] for i in det_index[0:self.max_detection]]

        # get iou matrix for given (img_id, cat_id), the output has shape (num_det, num_gt)
        iou_mat = self.ious[img_id, cat_id]

        num_iou_thresh = len(self.iou_thres)

        det_match = np.zeros((num_iou_thresh, num_det))
        gt_match = np.zeros((num_iou_thresh, num_gt))

        if len(iou_mat) != 0:
            # loop through each iou thresh
            for thres_idx, thres_value in enumerate(self.iou_thres):
                # loop through each detection, for each detection, match only one gt
                for det_idx, _ in enumerate(det):
                    m = -1
                    iou_threshold = min([thres_value, 1 - 1e-10])
                    # loop through each gt, find the gt gives max iou
                    for gt_idx, _ in enumerate(gt):
                        if gt_match[thres_idx, gt_idx] > 0:
                            continue
                        if iou_mat[det_idx, gt_idx] >= iou_threshold:
                            iou_threshold = iou_mat[det_idx, gt_idx]
                            m = gt_idx

                    if m != -1:
                        det_match[thres_idx, det_idx] = gt[m]['idx']
                        gt_match[thres_idx, m] = 1

        return {
            'image_id': img_id,
            'category_id': cat_id,
            'gtIds': [g['idx'] for g in gt],
            'dtMatches': det_match,  # shape (num_iou_thresh, num_det), value is zero or GT index
            'gtMatches': gt_match,  # shape (num_iou_thresh, num_gt), value 1 or zero
            'dtScores': [d['score'] for d in det],
            'num_gt': num_gt,
        }

    def accumulate(self) -> None:
        """Generate precision-recall curve.

        The per-image results in `self.evalimgs` are merged per category. The outcome is stored in `self.eval` under
        the keys 'counts', 'precision', 'recall' and 'scores'. Entries of categories without any ground truth box
        stay at -1.
        """
        self.image_ids = np.unique(self.image_ids)
        image_ids = self.image_ids.tolist()

        num_iou_thresh = len(self.iou_thres)
        num_recall_thresh = len(self.recall_thres)
        num_categories = len(self.categories)
        maxdets = self.max_detection

        # initialize these at -1
        precision_matrix = -np.ones((num_iou_thresh, num_recall_thresh, num_categories))
        recall_matrix = -np.ones((num_iou_thresh, num_categories))
        scores_matrix = -np.ones((num_iou_thresh, num_recall_thresh, num_categories))

        # loop through category
        for cat_index, cat_id in enumerate(self.categories):
            # Look results up by key; (category, image) pairs that were never evaluated count as "nothing there".
            eval_by_category = [self.evalimgs.get((cat_id, img_id)) for img_id in image_ids]
            eval_by_category = [e for e in eval_by_category if e is not None]

            # no image inside this category
            if not eval_by_category:
                continue

            # number of all image gts in one category
            num_all_gt = sum(e['num_gt'] for e in eval_by_category)
            # for all images no gt inside this category
            if num_all_gt == 0:
                continue

            det_scores = np.concatenate([e['dtScores'][0:maxdets] for e in eval_by_category])
            # rank the detections of all images together, highest score first
            sorted_score_inds = np.argsort(-det_scores, kind='mergesort')

            det_scores_sorted = det_scores[sorted_score_inds]
            det_match = np.concatenate([e['dtMatches'][:, 0:maxdets] for e in eval_by_category],
                                       axis=1)[:, sorted_score_inds]  # shape (num_iou_thresh, num_det_all_images)

            tps = det_match > 0
            fps = det_match == 0

            # The `np.float` alias no longer exists in recent NumPy releases; the builtin `float` is equivalent.
            tp_sum = np.cumsum(tps, axis=1).astype(float)
            fp_sum = np.cumsum(fps, axis=1).astype(float)

            for index, (true_positives, false_positives) in enumerate(zip(tp_sum, fp_sum)):
                nd = len(true_positives)
                recall = true_positives / num_all_gt
                precision = true_positives / (false_positives + true_positives + np.spacing(1))

                recall_matrix[index, cat_index] = recall[-1] if nd else 0

                # smooth precision along the curve, remove zigzag: every value becomes the maximum of itself and all
                # values to its right
                if nd:
                    precision = np.maximum.accumulate(precision[::-1])[::-1]

                inds = np.searchsorted(recall, self.recall_thres, side='left')
                # Recall levels that are never reached point past the last detection; they keep precision/score 0.
                reachable = inds < nd

                precision_at_recall = np.zeros((num_recall_thresh, ))
                score = np.zeros((num_recall_thresh, ))
                precision_at_recall[reachable] = precision[inds[reachable]]
                score[reachable] = det_scores_sorted[inds[reachable]]

                precision_matrix[index, :, cat_index] = precision_at_recall
                scores_matrix[index, :, cat_index] = score

        self.eval = {
            'counts': [num_iou_thresh, num_recall_thresh, num_categories],
            'precision': precision_matrix,
            'recall': recall_matrix,
            'scores': scores_matrix,
        }

    def summarize(self, iou: float = None) -> float:
        """Compute average precision given one intersection union threshold.

        Args:
            iou: Intersection over union threshold. If this value is `None`, then average all iou thresholds. The result
                is the mean average precision.

        Returns:
            Average precision, or -1 if there is no valid precision entry (including the case that `iou` is not one of
            the evaluated thresholds).
        """
        precision_at_iou = self.eval['precision']  # shape (num_iou_thresh, num_recall_thresh, num_categories)
        if iou is not None:
            # The thresholds come from np.linspace, so compare with a tolerance instead of exact float equality.
            iou_thresh_index = np.where(np.isclose(self.iou_thres, iou))[0]
            precision_at_iou = precision_at_iou[iou_thresh_index]

        valid = precision_at_iou[precision_at_iou > -1]  # -1 marks entries that were never filled
        if valid.size == 0:
            return -1
        return np.mean(valid)

    def compute_iou(self, det: List[Dict], gt: List[Dict]) -> np.ndarray:
        """Compute intersection over union.

        We leverage `maskUtils.iou`.

        Args:
            det: Detections of one image and one category. Each element is a dictionary with the keys 'x1', 'y1', 'w',
                'h' and 'score'.
            gt: Ground truth boxes of the same image and category. Each element is a dictionary with the keys 'x1',
                'y1', 'w' and 'h'.

        Returns:
            An empty list if both inputs are empty, otherwise the result of `maskUtils.iou`. Its rows follow the
            detections ordered by descending score and capped to `self.max_detection`.
        """
        if len(gt) == 0 and len(det) == 0:
            return []

        # same ordering and cap as in evaluate_img, so the rows line up with the detections used there
        inds = np.argsort([-d['score'] for d in det], kind='mergesort')
        det = [det[i] for i in inds[0:self.max_detection]]

        boxes_a = [[dt_elem['x1'], dt_elem['y1'], dt_elem['w'], dt_elem['h']] for dt_elem in det]
        boxes_b = [[gt_elem['x1'], gt_elem['y1'], gt_elem['w'], gt_elem['h']] for gt_elem in gt]

        iscrowd = [0] * len(gt)  # to leverage maskUtils.iou
        return maskUtils.iou(boxes_a, boxes_b, iscrowd)

`accumulate` ¶

Generate precision-recall curve.

Source code in fastestimator\fastestimator\trace\metric\mean_average_precision.py

def accumulate(self) -> None:
    """Generate precision-recall curve.

    The per-image results in `self.evalimgs` (keyed by `(cat_id, img_id)`) are merged per category. The outcome is
    stored in `self.eval` under the keys 'counts', 'precision', 'recall' and 'scores'. Entries of categories without
    any ground truth box stay at -1. As a side effect `self.image_ids` is replaced by its sorted unique values.
    """
    self.image_ids = np.unique(self.image_ids)
    image_ids = self.image_ids.tolist()

    num_iou_thresh = len(self.iou_thres)
    num_recall_thresh = len(self.recall_thres)
    num_categories = len(self.categories)
    maxdets = self.max_detection

    # initialize these at -1
    precision_matrix = -np.ones((num_iou_thresh, num_recall_thresh, num_categories))
    recall_matrix = -np.ones((num_iou_thresh, num_categories))
    scores_matrix = -np.ones((num_iou_thresh, num_recall_thresh, num_categories))

    # loop through category
    for cat_index, cat_id in enumerate(self.categories):
        # Look results up by key; (category, image) pairs that were never evaluated count as "nothing there".
        eval_by_category = [self.evalimgs.get((cat_id, img_id)) for img_id in image_ids]
        eval_by_category = [e for e in eval_by_category if e is not None]

        # no image inside this category
        if not eval_by_category:
            continue

        # number of all image gts in one category
        num_all_gt = sum(e['num_gt'] for e in eval_by_category)
        # for all images no gt inside this category
        if num_all_gt == 0:
            continue

        det_scores = np.concatenate([e['dtScores'][0:maxdets] for e in eval_by_category])
        # rank the detections of all images together, highest score first
        sorted_score_inds = np.argsort(-det_scores, kind='mergesort')

        det_scores_sorted = det_scores[sorted_score_inds]
        det_match = np.concatenate([e['dtMatches'][:, 0:maxdets] for e in eval_by_category],
                                   axis=1)[:, sorted_score_inds]  # shape (num_iou_thresh, num_det_all_images)

        tps = det_match > 0
        fps = det_match == 0

        # The `np.float` alias no longer exists in recent NumPy releases; the builtin `float` is equivalent.
        tp_sum = np.cumsum(tps, axis=1).astype(float)
        fp_sum = np.cumsum(fps, axis=1).astype(float)

        for index, (true_positives, false_positives) in enumerate(zip(tp_sum, fp_sum)):
            nd = len(true_positives)
            recall = true_positives / num_all_gt
            precision = true_positives / (false_positives + true_positives + np.spacing(1))

            recall_matrix[index, cat_index] = recall[-1] if nd else 0

            # smooth precision along the curve, remove zigzag: every value becomes the maximum of itself and all
            # values to its right
            if nd:
                precision = np.maximum.accumulate(precision[::-1])[::-1]

            inds = np.searchsorted(recall, self.recall_thres, side='left')
            # Recall levels that are never reached point past the last detection; they keep precision/score 0.
            reachable = inds < nd

            precision_at_recall = np.zeros((num_recall_thresh, ))
            score = np.zeros((num_recall_thresh, ))
            precision_at_recall[reachable] = precision[inds[reachable]]
            score[reachable] = det_scores_sorted[inds[reachable]]

            precision_matrix[index, :, cat_index] = precision_at_recall
            scores_matrix[index, :, cat_index] = score

    self.eval = {
        'counts': [num_iou_thresh, num_recall_thresh, num_categories],
        'precision': precision_matrix,
        'recall': recall_matrix,
        'scores': scores_matrix,
    }

`compute_iou` ¶

Compute intersection over union.

We leverage maskUtils.iou.

Parameters:

Name	Type	Description	Default
`det`	`np.ndarray`	Detection array.	required
`gt`	`np.ndarray`	Ground truth array.	required

Returns:

Type	Description
`np.ndarray`	Intersection over union array.

Source code in fastestimator\fastestimator\trace\metric\mean_average_precision.py

def compute_iou(self, det: List[Dict], gt: List[Dict]) -> np.ndarray:
    """Compute intersection over union.

    We leverage `maskUtils.iou`.

    Args:
        det: Detections of one image and one category. Each element is a dictionary with the keys 'x1', 'y1', 'w',
            'h' and 'score'.
        gt: Ground truth boxes of the same image and category. Each element is a dictionary with the keys 'x1',
            'y1', 'w' and 'h'.

    Returns:
        An empty list if both inputs are empty, otherwise the result of `maskUtils.iou`. Its rows follow the
        detections ordered by descending score and capped to `self.max_detection`.
    """
    if len(gt) == 0 and len(det) == 0:
        return []

    # stable sort by descending score, then keep at most max_detection detections
    inds = np.argsort([-d['score'] for d in det], kind='mergesort')
    det = [det[i] for i in inds[0:self.max_detection]]

    boxes_a = [[dt_elem['x1'], dt_elem['y1'], dt_elem['w'], dt_elem['h']] for dt_elem in det]
    boxes_b = [[gt_elem['x1'], gt_elem['y1'], gt_elem['w'], gt_elem['h']] for gt_elem in gt]

    iscrowd = [0] * len(gt)  # to leverage maskUtils.iou
    return maskUtils.iou(boxes_a, boxes_b, iscrowd)

`evaluate_img` ¶

Find gt matches for det given one image and one category.

Parameters:

Name	Type	Description	Default
`cat_id`	`int`		required
`img_id`	`int`		required

Source code in fastestimator\fastestimator\trace\metric\mean_average_precision.py

def evaluate_img(self, cat_id: int, img_id: int) -> Dict:
    """Match the detections of one image and one category against its ground truth boxes.

    Detections are visited in order of descending score. For every IoU threshold a detection is assigned to the
    not yet assigned ground truth box with the largest IoU that reaches the threshold; on equal IoU the later box
    wins.

    Args:
        cat_id: Category id.
        img_id: Image id.

    Returns:
        `None` if there are neither detections nor ground truth boxes, otherwise a dictionary describing the
        matches.
    """
    all_dets = self.det[img_id, cat_id]
    gt_boxes = self.gt[img_id, cat_id]
    det_count, gt_count = len(all_dets), len(gt_boxes)

    if det_count == 0 and gt_count == 0:
        return None

    # highest score first (stable), limited to max_detection entries
    order = np.argsort([-entry['score'] for entry in all_dets], kind='mergesort')
    kept_dets = [all_dets[pos] for pos in order[:self.max_detection]]

    # overlaps for this (img_id, cat_id), indexed as [detection, ground truth]
    overlaps = self.ious[img_id, cat_id]

    thresh_count = len(self.iou_thres)
    matched_det = np.zeros((thresh_count, det_count))
    matched_gt = np.zeros((thresh_count, gt_count))

    if len(overlaps) != 0:
        for t, thresh in enumerate(self.iou_thres):
            for d in range(len(kept_dets)):
                best_iou = min([thresh, 1 - 1e-10])
                best_gt = -1
                for g in range(gt_count):
                    # a ground truth box can be claimed only once per threshold
                    if matched_gt[t, g] <= 0 and overlaps[d, g] >= best_iou:
                        best_iou = overlaps[d, g]
                        best_gt = g

                if best_gt == -1:
                    continue
                matched_det[t, d] = gt_boxes[best_gt]['idx']
                matched_gt[t, best_gt] = 1

    result = {}
    result['image_id'] = img_id
    result['category_id'] = cat_id
    result['gtIds'] = [box['idx'] for box in gt_boxes]
    result['dtMatches'] = matched_det  # shape (num_iou_thresh, num_det), zero or the 'idx' of the matched gt
    result['gtMatches'] = matched_gt  # shape (num_iou_thresh, num_gt), one or zero
    result['dtScores'] = [entry['score'] for entry in kept_dets]
    result['num_gt'] = gt_count
    return result

`on_batch_begin` ¶

Reset instance variables.

Source code in fastestimator\fastestimator\trace\metric\mean_average_precision.py

def on_batch_begin(self, data: Data):
    """Clear all per-batch state before a new batch is processed."""
    # id bookkeeping that is only valid within one batch
    self.batch_image_ids = []
    self.ids_unique = []
    self.ids_batch_to_epoch = {}

    # ground truth boxes, detections and their overlaps
    self.gt = defaultdict(list)
    self.det = defaultdict(list)
    self.ious = defaultdict(list)

`on_epoch_begin` ¶

Reset instance variables.

Source code in fastestimator\fastestimator\trace\metric\mean_average_precision.py

def on_epoch_begin(self, data: Data):
    """Clear all per-epoch state before a new epoch starts."""
    self.ids_in_epoch = 0
    self.image_ids = []  # collects the image ids of every iteration in the epoch
    self.evalimgs, self.eval = {}, {}

`summarize` ¶

Compute average precision given one intersection union threshold.

Parameters:

Name	Type	Description	Default
`iou`	`float`	Intersection over union threshold. If this value is `None`, then average all iou thresholds. The result is the mean average precision.	`None`

Returns:

Type	Description
`float`	Average precision.

Source code in fastestimator\fastestimator\trace\metric\mean_average_precision.py

def summarize(self, iou: float = None) -> float:
    """Compute average precision given one intersection union threshold.

    Args:
        iou: Intersection over union threshold. If this value is `None`, then average all iou thresholds. The result
            is the mean average precision.

    Returns:
        Average precision, or -1 if there is no valid precision entry (including the case that `iou` is not one of
        the thresholds in `self.iou_thres`).
    """
    precision_at_iou = self.eval['precision']  # shape (num_iou_thresh, num_recall_thresh, num_categories)
    if iou is not None:
        # Compare with a tolerance: exact float equality can miss a threshold that differs only by rounding error.
        iou_thresh_index = np.where(np.isclose(self.iou_thres, iou))[0]
        precision_at_iou = precision_at_iou[iou_thresh_index]

    valid = precision_at_iou[precision_at_iou > -1]  # -1 marks entries that were never filled
    if valid.size == 0:
        return -1
    return np.mean(valid)

mean_average_precision