From 83d4386fa25e6bd4dd30d1174d5ca111d075b429 Mon Sep 17 00:00:00 2001 From: LinasKo Date: Fri, 8 Nov 2024 00:09:55 +0200 Subject: [PATCH 1/2] Implemented mAR metric --- supervision/metrics/__init__.py | 4 + supervision/metrics/mean_average_recall.py | 512 +++++++++++++++++++++ 2 files changed, 516 insertions(+) create mode 100644 supervision/metrics/mean_average_recall.py diff --git a/supervision/metrics/__init__.py b/supervision/metrics/__init__.py index 90fc17b47..12b243ce6 100644 --- a/supervision/metrics/__init__.py +++ b/supervision/metrics/__init__.py @@ -8,6 +8,10 @@ MeanAveragePrecision, MeanAveragePrecisionResult, ) +from supervision.metrics.mean_average_recall import ( + MeanAverageRecall, + MeanAverageRecallResult, +) from supervision.metrics.precision import Precision, PrecisionResult from supervision.metrics.recall import Recall, RecallResult from supervision.metrics.utils.object_size import ( diff --git a/supervision/metrics/mean_average_recall.py b/supervision/metrics/mean_average_recall.py new file mode 100644 index 000000000..5f0274aec --- /dev/null +++ b/supervision/metrics/mean_average_recall.py @@ -0,0 +1,512 @@ +from __future__ import annotations + +from copy import deepcopy +from dataclasses import dataclass +from typing import TYPE_CHECKING, List, Optional, Tuple, Union + +import numpy as np +from matplotlib import pyplot as plt + +from supervision.config import ORIENTED_BOX_COORDINATES +from supervision.detection.core import Detections +from supervision.detection.utils import ( + box_iou_batch, + mask_iou_batch, + oriented_box_iou_batch, +) +from supervision.draw.color import LEGACY_COLOR_PALETTE +from supervision.metrics.core import Metric, MetricTarget +from supervision.metrics.utils.object_size import ( + ObjectSizeCategory, + get_detection_size_category, +) +from supervision.metrics.utils.utils import ensure_pandas_installed + +if TYPE_CHECKING: + import pandas as pd + + +class MeanAverageRecall(Metric): + def __init__( + self, + metric_target: MetricTarget = MetricTarget.BOXES, + ): + self._metric_target = metric_target + + self._predictions_list: List[Detections] = [] + self._targets_list: List[Detections] = [] + + self.max_detections = np.array([1, 10, 100]) + + def reset(self) -> None: + self._predictions_list = [] + self._targets_list = [] + + def update( + self, + predictions: Union[Detections, List[Detections]], + targets: Union[Detections, List[Detections]], + ) -> MeanAverageRecall: + if not isinstance(predictions, list): + predictions = [predictions] + if not isinstance(targets, list): + targets = [targets] + + if len(predictions) != len(targets): + raise ValueError( + f"The number of predictions ({len(predictions)}) and" + f" targets ({len(targets)}) during the update must be the same." + ) + + self._predictions_list.extend(predictions) + self._targets_list.extend(targets) + + return self + + def compute(self) -> MeanAverageRecallResult: + result = self._compute(self._predictions_list, self._targets_list) + + small_predictions, small_targets = self._filter_predictions_and_targets_by_size( + self._predictions_list, self._targets_list, ObjectSizeCategory.SMALL + ) + result.small_objects = self._compute(small_predictions, small_targets) + + medium_predictions, medium_targets = ( + self._filter_predictions_and_targets_by_size( + self._predictions_list, self._targets_list, ObjectSizeCategory.MEDIUM + ) + ) + result.medium_objects = self._compute(medium_predictions, medium_targets) + + large_predictions, large_targets = self._filter_predictions_and_targets_by_size( + self._predictions_list, self._targets_list, ObjectSizeCategory.LARGE + ) + result.large_objects = self._compute(large_predictions, large_targets) + + return result + + def _compute( + self, predictions_list: List[Detections], targets_list: List[Detections] + ) -> MeanAverageRecallResult: + iou_thresholds = np.linspace(0.5, 0.95, 10) + stats = [] + + for predictions, targets in zip(predictions_list, targets_list): + prediction_contents = self._detections_content(predictions) + target_contents = self._detections_content(targets) + + if len(targets) > 0: + if len(predictions) == 0: + stats.append( + ( + np.zeros((0, iou_thresholds.size), dtype=bool), + np.zeros((0,), dtype=np.float32), + np.zeros((0,), dtype=int), + targets.class_id, + ) + ) + + else: + if self._metric_target == MetricTarget.BOXES: + iou = box_iou_batch(target_contents, prediction_contents) + elif self._metric_target == MetricTarget.MASKS: + iou = mask_iou_batch(target_contents, prediction_contents) + elif self._metric_target == MetricTarget.ORIENTED_BOUNDING_BOXES: + iou = oriented_box_iou_batch( + target_contents, prediction_contents + ) + else: + raise ValueError( + "Unsupported metric target for IoU calculation" + ) + + matches = self._match_detection_batch( + predictions.class_id, targets.class_id, iou, iou_thresholds + ) + stats.append( + ( + matches, + predictions.confidence, + predictions.class_id, + targets.class_id, + ) + ) + + if not stats: + return MeanAverageRecallResult( + metric_target=self._metric_target, + recall_scores=np.zeros(iou_thresholds.shape[0]), + recall_per_class=np.zeros((0, iou_thresholds.shape[0])), + max_detections=self.max_detections, + iou_thresholds=iou_thresholds, + matched_classes=np.array([], dtype=int), + small_objects=None, + medium_objects=None, + large_objects=None, + ) + + concatenated_stats = [np.concatenate(items, 0) for items in zip(*stats)] + recall_scores_per_k, recall_per_class, unique_classes = ( + self._compute_average_recall_for_classes(*concatenated_stats) + ) + + return MeanAverageRecallResult( + metric_target=self._metric_target, + recall_scores=recall_scores_per_k, + recall_per_class=recall_per_class, + max_detections=self.max_detections, + iou_thresholds=iou_thresholds, + matched_classes=unique_classes, + small_objects=None, + medium_objects=None, + large_objects=None, + ) + + def _compute_average_recall_for_classes( + self, + matches: np.ndarray, + prediction_confidence: np.ndarray, + prediction_class_ids: np.ndarray, + true_class_ids: np.ndarray, + ) -> Tuple[np.ndarray, np.ndarray, np.ndarray]: + sorted_indices = np.argsort(-prediction_confidence) + matches = matches[sorted_indices] + prediction_class_ids = prediction_class_ids[sorted_indices] + unique_classes, class_counts = np.unique(true_class_ids, return_counts=True) + + recalls_at_k = [] + for max_detections in self.max_detections: + # Shape: PxTh,P,C,C -> CxThx3 + confusion_matrix = self._compute_confusion_matrix( + matches, + prediction_class_ids, + unique_classes, + class_counts, + max_detections=max_detections, + ) + + # Shape: CxThx3 -> CxTh + recall_per_class = self._compute_recall(confusion_matrix) + recalls_at_k.append(recall_per_class) + + # Shape: KxCxTh -> KxC + recalls_at_k = np.array(recalls_at_k) + average_recall_per_class = np.mean(recalls_at_k, axis=2) + + # Shape: KxC -> K + recall_scores = np.mean(average_recall_per_class, axis=1) + + return recall_scores, recall_per_class, unique_classes + + @staticmethod + def _match_detection_batch( + predictions_classes: np.ndarray, + target_classes: np.ndarray, + iou: np.ndarray, + iou_thresholds: np.ndarray, + ) -> np.ndarray: + num_predictions, num_iou_levels = ( + predictions_classes.shape[0], + iou_thresholds.shape[0], + ) + correct = np.zeros((num_predictions, num_iou_levels), dtype=bool) + correct_class = target_classes[:, None] == predictions_classes + + for i, iou_level in enumerate(iou_thresholds): + matched_indices = np.where((iou >= iou_level) & correct_class) + + if matched_indices[0].shape[0]: + combined_indices = np.stack(matched_indices, axis=1) + iou_values = iou[matched_indices][:, None] + matches = np.hstack([combined_indices, iou_values]) + + if matched_indices[0].shape[0] > 1: + matches = matches[matches[:, 2].argsort()[::-1]] + matches = matches[np.unique(matches[:, 1], return_index=True)[1]] + matches = matches[np.unique(matches[:, 0], return_index=True)[1]] + + correct[matches[:, 1].astype(int), i] = True + + return correct + + @staticmethod + def _compute_confusion_matrix( + sorted_matches: np.ndarray, + sorted_prediction_class_ids: np.ndarray, + unique_classes: np.ndarray, + class_counts: np.ndarray, + max_detections: Optional[int] = None, + ) -> np.ndarray: + num_thresholds = sorted_matches.shape[1] + num_classes = unique_classes.shape[0] + + confusion_matrix = np.zeros((num_classes, num_thresholds, 3)) + for class_idx, class_id in enumerate(unique_classes): + is_class = sorted_prediction_class_ids == class_id + num_true = class_counts[class_idx] + num_predictions = is_class.sum() + + if num_predictions == 0: + true_positives = np.zeros(num_thresholds) + false_positives = np.zeros(num_thresholds) + false_negatives = np.full(num_thresholds, num_true) + elif num_true == 0: + true_positives = np.zeros(num_thresholds) + false_positives = np.full(num_thresholds, num_predictions) + false_negatives = np.zeros(num_thresholds) + else: + limited_matches = sorted_matches[is_class][slice(max_detections)] + true_positives = limited_matches.sum(0) + + false_positives = (1 - limited_matches).sum(0) + false_negatives = num_true - true_positives + false_negatives = num_true - true_positives + confusion_matrix[class_idx] = np.stack( + [true_positives, false_positives, false_negatives], axis=1 + ) + + return confusion_matrix + + @staticmethod + def _compute_recall(confusion_matrix: np.ndarray) -> np.ndarray: + """ + Broadcastable function, computing the recall from the confusion matrix. + + Arguments: + confusion_matrix: np.ndarray, shape (N, ..., 3), where the last dimension + contains the true positives, false positives, and false negatives. + + Returns: + np.ndarray, shape (N, ...), containing the recall for each element. + """ + if not confusion_matrix.shape[-1] == 3: + raise ValueError( + f"Confusion matrix must have shape (..., 3), got " + f"{confusion_matrix.shape}" + ) + true_positives = confusion_matrix[..., 0] + false_negatives = confusion_matrix[..., 2] + + denominator = true_positives + false_negatives + recall = np.where(denominator == 0, 0, true_positives / denominator) + + return recall + + def _detections_content(self, detections: Detections) -> np.ndarray: + """Return boxes, masks or oriented bounding boxes from detections.""" + if self._metric_target == MetricTarget.BOXES: + return detections.xyxy + if self._metric_target == MetricTarget.MASKS: + return ( + detections.mask + if detections.mask is not None + else self._make_empty_content() + ) + if self._metric_target == MetricTarget.ORIENTED_BOUNDING_BOXES: + obb = detections.data.get(ORIENTED_BOX_COORDINATES) + if obb is not None and len(obb) > 0: + return np.array(obb, dtype=np.float32) + return self._make_empty_content() + raise ValueError(f"Invalid metric target: {self._metric_target}") + + def _make_empty_content(self) -> np.ndarray: + if self._metric_target == MetricTarget.BOXES: + return np.empty((0, 4), dtype=np.float32) + if self._metric_target == MetricTarget.MASKS: + return np.empty((0, 0, 0), dtype=bool) + if self._metric_target == MetricTarget.ORIENTED_BOUNDING_BOXES: + return np.empty((0, 4, 2), dtype=np.float32) + raise ValueError(f"Invalid metric target: {self._metric_target}") + + def _filter_detections_by_size( + self, detections: Detections, size_category: ObjectSizeCategory + ) -> Detections: + """Return a copy of detections with contents filtered by object size.""" + new_detections = deepcopy(detections) + if detections.is_empty() or size_category == ObjectSizeCategory.ANY: + return new_detections + + sizes = get_detection_size_category(new_detections, self._metric_target) + size_mask = sizes == size_category.value + + new_detections.xyxy = new_detections.xyxy[size_mask] + if new_detections.mask is not None: + new_detections.mask = new_detections.mask[size_mask] + if new_detections.class_id is not None: + new_detections.class_id = new_detections.class_id[size_mask] + if new_detections.confidence is not None: + new_detections.confidence = new_detections.confidence[size_mask] + if new_detections.tracker_id is not None: + new_detections.tracker_id = new_detections.tracker_id[size_mask] + if new_detections.data is not None: + for key, value in new_detections.data.items(): + new_detections.data[key] = np.array(value)[size_mask] + + return new_detections + + def _filter_predictions_and_targets_by_size( + self, + predictions_list: List[Detections], + targets_list: List[Detections], + size_category: ObjectSizeCategory, + ) -> Tuple[List[Detections], List[Detections]]: + new_predictions_list = [] + new_targets_list = [] + for predictions, targets in zip(predictions_list, targets_list): + new_predictions_list.append( + self._filter_detections_by_size(predictions, size_category) + ) + new_targets_list.append( + self._filter_detections_by_size(targets, size_category) + ) + return new_predictions_list, new_targets_list + + +@dataclass +class MeanAverageRecallResult: + metric_target: MetricTarget + + @property + def mAR_at_1(self) -> float: + return self.recall_scores[0] + + @property + def mAR_at_10(self) -> float: + return self.recall_scores[1] + + @property + def mAR_at_100(self) -> float: + return self.recall_scores[2] + + recall_scores: np.ndarray + recall_per_class: np.ndarray + max_detections: np.ndarray + iou_thresholds: np.ndarray + matched_classes: np.ndarray + + small_objects: Optional[MeanAverageRecallResult] + medium_objects: Optional[MeanAverageRecallResult] + large_objects: Optional[MeanAverageRecallResult] + + def __str__(self) -> str: + out_str = ( + f"{self.__class__.__name__}:\n" + f"Metric target: {self.metric_target}\n" + f"mAR @ 1: {self.mAR_at_1:.4f}\n" + f"mAR @ 10: {self.mAR_at_10:.4f}\n" + f"mAR @ 100: {self.mAR_at_100:.4f}\n" + f"max detections: {self.max_detections}\n" + f"IoU thresh: {self.iou_thresholds}\n" + f"mAR per class:\n" + ) + if self.recall_per_class.size == 0: + out_str += " No results\n" + for class_id, recall_of_class in zip( + self.matched_classes, self.recall_per_class + ): + out_str += f" {class_id}: {recall_of_class}\n" + + indent = " " + if self.small_objects is not None: + indented = indent + str(self.small_objects).replace("\n", f"\n{indent}") + out_str += f"\nSmall objects:\n{indented}" + if self.medium_objects is not None: + indented = indent + str(self.medium_objects).replace("\n", f"\n{indent}") + out_str += f"\nMedium objects:\n{indented}" + if self.large_objects is not None: + indented = indent + str(self.large_objects).replace("\n", f"\n{indent}") + out_str += f"\nLarge objects:\n{indented}" + + return out_str + + def to_pandas(self) -> "pd.DataFrame": + ensure_pandas_installed() + import pandas as pd + + pandas_data = { + "mAR @ 1": self.mAR_at_1, + "mAR @ 10": self.mAR_at_10, + "mAR @ 100": self.mAR_at_100, + } + + if self.small_objects is not None: + small_objects_df = self.small_objects.to_pandas() + for key, value in small_objects_df.items(): + pandas_data[f"small_objects_{key}"] = value + if self.medium_objects is not None: + medium_objects_df = self.medium_objects.to_pandas() + for key, value in medium_objects_df.items(): + pandas_data[f"medium_objects_{key}"] = value + if self.large_objects is not None: + large_objects_df = self.large_objects.to_pandas() + for key, value in large_objects_df.items(): + pandas_data[f"large_objects_{key}"] = value + + return pd.DataFrame(pandas_data, index=[0]) + + def plot(self): + labels = ["mAR @ 1", "mAR @ 10", "mAR @ 100"] + values = [self.mAR_at_1, self.mAR_at_10, self.mAR_at_100] + colors = [LEGACY_COLOR_PALETTE[0]] * 3 + + if self.small_objects is not None: + small_objects = self.small_objects + labels += ["Small: mAR @ 1", "Small: mAR @ 10", "Small: mAR @ 100"] + values += [ + small_objects.mAR_at_1, + small_objects.mAR_at_10, + small_objects.mAR_at_100, + ] + colors += [LEGACY_COLOR_PALETTE[3]] * 3 + + if self.medium_objects is not None: + medium_objects = self.medium_objects + labels += ["Medium: mAR @ 1", "Medium: mAR @ 10", "Medium: mAR @ 100"] + values += [ + medium_objects.mAR_at_1, + medium_objects.mAR_at_10, + medium_objects.mAR_at_100, + ] + colors += [LEGACY_COLOR_PALETTE[2]] * 3 + + if self.large_objects is not None: + large_objects = self.large_objects + labels += ["Large: mAR @ 1", "Large: mAR @ 10", "Large: mAR @ 100"] + values += [ + large_objects.mAR_at_1, + large_objects.mAR_at_10, + large_objects.mAR_at_100, + ] + colors += [LEGACY_COLOR_PALETTE[4]] * 3 + + plt.rcParams["font.family"] = "monospace" + + _, ax = plt.subplots(figsize=(10, 6)) + ax.set_ylim(0, 1) + ax.set_ylabel("Value", fontweight="bold") + title = ( + f"Mean Average Recall, by Object Size" + f"\n(target: {self.metric_target.value}" + ) + ax.set_title(title, fontweight="bold") + + x_positions = range(len(labels)) + bars = ax.bar(x_positions, values, color=colors, align="center") + + ax.set_xticks(x_positions) + ax.set_xticklabels(labels, rotation=45, ha="right") + + for bar in bars: + y_value = bar.get_height() + ax.text( + bar.get_x() + bar.get_width() / 2, + y_value + 0.02, + f"{y_value:.2f}", + ha="center", + va="bottom", + ) + + plt.rcParams["font.family"] = "sans-serif" + + plt.tight_layout() + plt.show() From 0bfcdeab6f19ae282f9cf448f45aa9fca9ddd663 Mon Sep 17 00:00:00 2001 From: LinasKo Date: Fri, 8 Nov 2024 01:01:52 +0200 Subject: [PATCH 2/2] Add mAR docstrings & examples --- docs/metrics/f1_score.md | 1 - docs/metrics/mean_average_precision.md | 1 - docs/metrics/mean_average_recall.md | 18 ++ mkdocs.yml | 1 + supervision/metrics/mean_average_recall.py | 189 ++++++++++++++++++++- supervision/metrics/recall.py | 4 +- 6 files changed, 208 insertions(+), 6 deletions(-) create mode 100644 docs/metrics/mean_average_recall.md diff --git a/docs/metrics/f1_score.md b/docs/metrics/f1_score.md index e31a95577..5cf0cd77f 100644 --- a/docs/metrics/f1_score.md +++ b/docs/metrics/f1_score.md @@ -1,6 +1,5 @@ --- comments: true -status: new --- # F1 Score diff --git a/docs/metrics/mean_average_precision.md b/docs/metrics/mean_average_precision.md index 817591a19..9e23045e4 100644 --- a/docs/metrics/mean_average_precision.md +++ b/docs/metrics/mean_average_precision.md @@ -1,6 +1,5 @@ --- comments: true -status: new --- # Mean Average Precision diff --git a/docs/metrics/mean_average_recall.md b/docs/metrics/mean_average_recall.md new file mode 100644 index 000000000..5cc0bf0a2 --- /dev/null +++ b/docs/metrics/mean_average_recall.md @@ -0,0 +1,18 @@ +--- +comments: true +status: new +--- + +# Mean Average Recall + + + +:::supervision.metrics.mean_average_recall.MeanAverageRecall + + + +:::supervision.metrics.mean_average_recall.MeanAverageRecallResult diff --git a/mkdocs.yml b/mkdocs.yml index 8c939cf07..1ed9fafa3 100644 --- a/mkdocs.yml +++ b/mkdocs.yml @@ -66,6 +66,7 @@ nav: - Utils: datasets/utils.md - Metrics: - mAP: metrics/mean_average_precision.md + - mAR: metrics/mean_average_recall.md - Precision: metrics/precision.md - Recall: metrics/recall.md - F1 Score: metrics/f1_score.md diff --git a/supervision/metrics/mean_average_recall.py b/supervision/metrics/mean_average_recall.py index 5f0274aec..9c3a40718 100644 --- a/supervision/metrics/mean_average_recall.py +++ b/supervision/metrics/mean_average_recall.py @@ -27,10 +27,64 @@ class MeanAverageRecall(Metric): + """ + Mean Average Recall (mAR) measures how well the model detects + and retrieves relevant objects by averaging recall over multiple + IoU thresholds, classes and detection limits. + + Intuitively, while Recall measures the ability to find all relevant + objects, mAR narrows down how many detections are considered for each + class. For example, mAR @ 100 considers the top 100 highest confidence + detections for each class. mAR @ 1 considers only the highest + confidence detection for each class. + + Example: + ```python + import supervision as sv + from supervision.metrics import MeanAverageRecall + + predictions = sv.Detections(...) + targets = sv.Detections(...) + + map_metric = MeanAverageRecall() + map_result = map_metric.update(predictions, targets).compute() + + print(mar_results.mar_at_100) + # 0.5241 + + print(mar_results) + # MeanAverageRecallResult: + # Metric target: MetricTarget.BOXES + # mAR @ 1: 0.1362 + # mAR @ 10: 0.4239 + # mAR @ 100: 0.5241 + # max detections: [1 10 100] + # IoU thresh: [0.5 0.55 0.6 ...] + # mAR per class: + # 0: [0.78571 0.78571 0.78571 ...] + # ... + # Small objects: ... + # Medium objects: ... + # Large objects: ... + + mar_results.plot() + ``` + + ![example_plot](\ + https://media.roboflow.com/supervision-docs/metrics/mAR_plot_example.png\ + ){ align=center width="800" } + """ + def __init__( self, metric_target: MetricTarget = MetricTarget.BOXES, ): + """ + Initialize the Mean Average Recall metric. + + Args: + metric_target (MetricTarget): The type of detection data to use. + """ self._metric_target = metric_target self._predictions_list: List[Detections] = [] @@ -39,6 +93,9 @@ def __init__( self.max_detections = np.array([1, 10, 100]) def reset(self) -> None: + """ + Reset the metric to its initial state, clearing all stored data. + """ self._predictions_list = [] self._targets_list = [] @@ -47,6 +104,16 @@ def update( predictions: Union[Detections, List[Detections]], targets: Union[Detections, List[Detections]], ) -> MeanAverageRecall: + """ + Add new predictions and targets to the metric, but do not compute the result. + + Args: + predictions (Union[Detections, List[Detections]]): The predicted detections. + targets (Union[Detections, List[Detections]]): The target detections. + + Returns: + (Recall): The updated metric instance. + """ if not isinstance(predictions, list): predictions = [predictions] if not isinstance(targets, list): @@ -64,6 +131,13 @@ def update( return self def compute(self) -> MeanAverageRecallResult: + """ + Calculate the Mean Average Recall metric based on the stored predictions + and ground-truth, at different IoU thresholds and maximum detection counts. + + Returns: + (MeanAverageRecallResult): The Mean Average Recall metric result. + """ result = self._compute(self._predictions_list, self._targets_list) small_predictions, small_targets = self._filter_predictions_and_targets_by_size( @@ -237,6 +311,29 @@ def _compute_confusion_matrix( class_counts: np.ndarray, max_detections: Optional[int] = None, ) -> np.ndarray: + """ + Compute the confusion matrix for each class and IoU threshold. + + Assumes the matches and prediction_class_ids are sorted by confidence + in descending order. + + Args: + sorted_matches: np.ndarray, bool, shape (P, Th), that is True + if the prediction is a true positive at the given IoU threshold. + sorted_prediction_class_ids: np.ndarray, int, shape (P,), containing + the class id for each prediction. + unique_classes: np.ndarray, int, shape (C,), containing the unique + class ids. + class_counts: np.ndarray, int, shape (C,), containing the number + of true instances for each class. + max_detections: Optional[int], the maximum number of detections to + consider for each class. Extra detections are considered false + positives. By default, all detections are considered. + + Returns: + np.ndarray, shape (C, Th, 3), containing the true positives, false + positives, and false negatives for each class and IoU threshold. + """ num_thresholds = sorted_matches.shape[1] num_classes = unique_classes.shape[0] @@ -364,6 +461,61 @@ def _filter_predictions_and_targets_by_size( @dataclass class MeanAverageRecallResult: + # """ + # The results of the recall metric calculation. + + # Defaults to `0` if no detections or targets were provided. + + # Attributes: + # metric_target (MetricTarget): the type of data used for the metric - + # boxes, masks or oriented bounding boxes. + # averaging_method (AveragingMethod): the averaging method used to compute the + # recall. Determines how the recall is aggregated across classes. + # recall_at_50 (float): the recall at IoU threshold of `0.5`. + # recall_at_75 (float): the recall at IoU threshold of `0.75`. + # recall_scores (np.ndarray): the recall scores at each IoU threshold. + # Shape: `(num_iou_thresholds,)` + # recall_per_class (np.ndarray): the recall scores per class and IoU threshold. + # Shape: `(num_target_classes, num_iou_thresholds)` + # iou_thresholds (np.ndarray): the IoU thresholds used in the calculations. + # matched_classes (np.ndarray): the class IDs of all matched classes. + # Corresponds to the rows of `recall_per_class`. + # small_objects (Optional[RecallResult]): the Recall metric results + # for small objects. + # medium_objects (Optional[RecallResult]): the Recall metric results + # for medium objects. + # large_objects (Optional[RecallResult]): the Recall metric results + # for large objects. + # """ + """ + The results of the Mean Average Recall metric calculation. + + Defaults to `0` if no detections or targets were provided. + + Attributes: + metric_target (MetricTarget): the type of data used for the metric - + boxes, masks or oriented bounding boxes. + mAR_at_1 (float): the Mean Average Recall, when considering only the top + highest confidence detection for each class. + mAR_at_10 (float): the Mean Average Recall, when considering top 10 + highest confidence detections for each class. + mAR_at_100 (float): the Mean Average Recall, when considering top 100 + highest confidence detections for each class. + recall_per_class (np.ndarray): the recall scores per class and IoU threshold. + Shape: `(num_target_classes, num_iou_thresholds)` + max_detections (np.ndarray): the array with maximum number of detections + considered. + iou_thresholds (np.ndarray): the IoU thresholds used in the calculations. + matched_classes (np.ndarray): the class IDs of all matched classes. + Corresponds to the rows of `recall_per_class`. + small_objects (Optional[MeanAverageRecallResult]): the Mean Average Recall + metric results for small objects (area < 32²). + medium_objects (Optional[MeanAverageRecallResult]): the Mean Average Recall + metric results for medium objects (32² ≤ area < 96²). + large_objects (Optional[MeanAverageRecallResult]): the Mean Average Recall + metric results for large objects (area ≥ 96²). + """ + metric_target: MetricTarget @property @@ -389,9 +541,29 @@ def mAR_at_100(self) -> float: large_objects: Optional[MeanAverageRecallResult] def __str__(self) -> str: + """ + Format as a pretty string. + + Example: + ```python + # MeanAverageRecallResult: + # Metric target: MetricTarget.BOXES + # mAR @ 1: 0.1362 + # mAR @ 10: 0.4239 + # mAR @ 100: 0.5241 + # max detections: [1 10 100] + # IoU thresh: [0.5 0.55 0.6 ...] + # mAR per class: + # 0: [0.78571 0.78571 0.78571 ...] + # ... + # Small objects: ... + # Medium objects: ... + # Large objects: ... + ``` + """ out_str = ( f"{self.__class__.__name__}:\n" - f"Metric target: {self.metric_target}\n" + f"Metric target: {self.metric_target}\n" f"mAR @ 1: {self.mAR_at_1:.4f}\n" f"mAR @ 10: {self.mAR_at_10:.4f}\n" f"mAR @ 100: {self.mAR_at_100:.4f}\n" @@ -420,6 +592,12 @@ def __str__(self) -> str: return out_str def to_pandas(self) -> "pd.DataFrame": + """ + Convert the result to a pandas DataFrame. + + Returns: + (pd.DataFrame): The result as a DataFrame. + """ ensure_pandas_installed() import pandas as pd @@ -445,6 +623,13 @@ def to_pandas(self) -> "pd.DataFrame": return pd.DataFrame(pandas_data, index=[0]) def plot(self): + """ + Plot the Mean Average Recall results. + + ![example_plot](\ + https://media.roboflow.com/supervision-docs/metrics/mAR_plot_example.png\ + ){ align=center width="800" } + """ labels = ["mAR @ 1", "mAR @ 10", "mAR @ 100"] values = [self.mAR_at_1, self.mAR_at_10, self.mAR_at_100] colors = [LEGACY_COLOR_PALETTE[0]] * 3 @@ -486,7 +671,7 @@ def plot(self): ax.set_ylabel("Value", fontweight="bold") title = ( f"Mean Average Recall, by Object Size" - f"\n(target: {self.metric_target.value}" + f"\n(target: {self.metric_target.value})" ) ax.set_title(title, fontweight="bold") diff --git a/supervision/metrics/recall.py b/supervision/metrics/recall.py index 1848502b7..21bba1a6e 100644 --- a/supervision/metrics/recall.py +++ b/supervision/metrics/recall.py @@ -115,11 +115,11 @@ def update( def compute(self) -> RecallResult: """ - Calculate the precision metric based on the stored predictions and ground-truth + Calculate the recall metric based on the stored predictions and ground-truth data, at different IoU thresholds. Returns: - (RecallResult): The precision metric result. + (RecallResult): The recall metric result. """ result = self._compute(self._predictions_list, self._targets_list)