Metrics

`Metric` `dataclass`

Bases: BaseMetric

Object Detection Metric.

Attributes:

Name	Type	Description
`type`	`str`	The metric type.
`value`	`int \| float \| dict`	The metric value.
`parameters`	`dict[str, Any]`	A dictionary containing metric parameters.

Source code in valor_lite/object_detection/metric.py

@dataclass
class Metric(BaseMetric):
    """
    Object Detection Metric.

    Instances are normally created through the classmethod factories below
    (e.g. `Metric.precision`, `Metric.counts`), each of which fills in the
    matching `MetricType` value and the parameter dictionary for that metric.

    Attributes
    ----------
    type : str
        The metric type.
    value : int | float | dict
        The metric value.
    parameters : dict[str, Any]
        A dictionary containing metric parameters.
    """

    def __post_init__(self):
        """
        Validate the field types once the dataclass has been initialized.

        Raises
        ------
        TypeError
            If `type` is not a `str`, if `value` is not an `int`, `float` or `dict`,
            if `parameters` is not a `dict`, or if any key of `parameters` is not a `str`.
        """
        if not isinstance(self.type, str):
            raise TypeError(
                f"Metric type should be of type 'str': {self.type}"
            )
        if not isinstance(self.value, (int, float, dict)):
            raise TypeError(
                f"Metric value must be of type 'int', 'float' or 'dict': {self.value}"
            )
        if not isinstance(self.parameters, dict):
            raise TypeError(
                f"Metric parameters must be of type 'dict[str, Any]': {self.parameters}"
            )
        # A generator lets `all` stop at the first non-string key instead of
        # materializing a full list of booleans first.
        if not all(isinstance(key, str) for key in self.parameters):
            raise TypeError(
                f"Metric parameter dictionary should only have keys with type 'str': {self.parameters}"
            )

    @classmethod
    def precision(
        cls,
        value: float,
        label: str,
        iou_threshold: float,
        score_threshold: float,
    ):
        """
        Precision metric for a specific class label in object detection.

        The returned metric encapsulates a metric value for a particular class label,
        along with the associated Intersection over Union (IOU) threshold and
        confidence score threshold.

        Parameters
        ----------
        value : float
            The metric value.
        label : str
            The class label for which the metric is calculated.
        iou_threshold : float
            The IOU threshold used to determine matches between predicted and ground truth boxes.
        score_threshold : float
            The confidence score threshold above which predictions are considered.

        Returns
        -------
        Metric
        """
        return cls(
            type=MetricType.Precision.value,
            value=value,
            parameters={
                "label": label,
                "iou_threshold": iou_threshold,
                "score_threshold": score_threshold,
            },
        )

    @classmethod
    def recall(
        cls,
        value: float,
        label: str,
        iou_threshold: float,
        score_threshold: float,
    ):
        """
        Recall metric for a specific class label in object detection.

        The returned metric encapsulates a metric value for a particular class label,
        along with the associated Intersection over Union (IOU) threshold and
        confidence score threshold.

        Parameters
        ----------
        value : float
            The metric value.
        label : str
            The class label for which the metric is calculated.
        iou_threshold : float
            The IOU threshold used to determine matches between predicted and ground truth boxes.
        score_threshold : float
            The confidence score threshold above which predictions are considered.

        Returns
        -------
        Metric
        """
        return cls(
            type=MetricType.Recall.value,
            value=value,
            parameters={
                "label": label,
                "iou_threshold": iou_threshold,
                "score_threshold": score_threshold,
            },
        )

    @classmethod
    def f1_score(
        cls,
        value: float,
        label: str,
        iou_threshold: float,
        score_threshold: float,
    ):
        """
        F1 score for a specific class label in object detection.

        The returned metric encapsulates a metric value for a particular class label,
        along with the associated Intersection over Union (IOU) threshold and
        confidence score threshold.

        Parameters
        ----------
        value : float
            The metric value.
        label : str
            The class label for which the metric is calculated.
        iou_threshold : float
            The IOU threshold used to determine matches between predicted and ground truth boxes.
        score_threshold : float
            The confidence score threshold above which predictions are considered.

        Returns
        -------
        Metric
        """
        return cls(
            type=MetricType.F1.value,
            value=value,
            parameters={
                "label": label,
                "iou_threshold": iou_threshold,
                "score_threshold": score_threshold,
            },
        )

    @classmethod
    def average_precision(
        cls,
        value: float,
        iou_threshold: float,
        label: str,
    ):
        """
        Average Precision (AP) metric for object detection tasks.

        The AP computation uses 101-point interpolation, which calculates the average
        precision by interpolating the precision-recall curve at 101 evenly spaced recall
        levels from 0 to 1.

        Parameters
        ----------
        value : float
            The average precision value.
        iou_threshold : float
            The IOU threshold used to compute the AP.
        label : str
            The class label for which the AP is computed.

        Returns
        -------
        Metric
        """
        return cls(
            type=MetricType.AP.value,
            value=value,
            parameters={
                "iou_threshold": iou_threshold,
                "label": label,
            },
        )

    @classmethod
    def mean_average_precision(
        cls,
        value: float,
        iou_threshold: float,
    ):
        """
        Mean Average Precision (mAP) metric for object detection tasks.

        The AP computation uses 101-point interpolation, which calculates the average
        precision for each class by interpolating the precision-recall curve at 101 evenly
        spaced recall levels from 0 to 1. The mAP is then calculated by averaging these
        values across all class labels.

        Parameters
        ----------
        value : float
            The mean average precision value.
        iou_threshold : float
            The IOU threshold used to compute the mAP.

        Returns
        -------
        Metric
        """
        return cls(
            type=MetricType.mAP.value,
            value=value,
            parameters={
                "iou_threshold": iou_threshold,
            },
        )

    @classmethod
    def average_precision_averaged_over_IOUs(
        cls,
        value: float,
        iou_thresholds: list[float],
        label: str,
    ):
        """
        Average Precision (AP) metric averaged over multiple IOU thresholds.

        The AP computation uses 101-point interpolation, which calculates the average precision
        by interpolating the precision-recall curve at 101 evenly spaced recall levels from 0 to 1
        for each IOU threshold specified in `iou_thresholds`. The final APAveragedOverIOUs value is
        obtained by averaging these AP values across all specified IOU thresholds.

        Parameters
        ----------
        value : float
            The average precision value averaged over the specified IOU thresholds.
        iou_thresholds : list[float]
            The list of IOU thresholds used to compute the AP values.
        label : str
            The class label for which the AP is computed.

        Returns
        -------
        Metric
        """
        return cls(
            type=MetricType.APAveragedOverIOUs.value,
            value=value,
            parameters={
                "iou_thresholds": iou_thresholds,
                "label": label,
            },
        )

    @classmethod
    def mean_average_precision_averaged_over_IOUs(
        cls,
        value: float,
        iou_thresholds: list[float],
    ):
        """
        Mean Average Precision (mAP) metric averaged over multiple IOU thresholds.

        The AP computation uses 101-point interpolation, which calculates the average precision
        by interpolating the precision-recall curve at 101 evenly spaced recall levels from 0 to 1
        for each IOU threshold specified in `iou_thresholds`. The final mAPAveragedOverIOUs value is
        obtained by averaging these AP values across all specified IOU thresholds and all class labels.

        Parameters
        ----------
        value : float
            The mean average precision value averaged over the specified IOU thresholds.
        iou_thresholds : list[float]
            The list of IOU thresholds used to compute the AP values.

        Returns
        -------
        Metric
        """
        return cls(
            type=MetricType.mAPAveragedOverIOUs.value,
            value=value,
            parameters={
                "iou_thresholds": iou_thresholds,
            },
        )

    @classmethod
    def average_recall(
        cls,
        value: float,
        score_threshold: float,
        iou_thresholds: list[float],
        label: str,
    ):
        """
        Average Recall (AR) metric for object detection tasks.

        The AR computation considers detections with confidence scores above the specified
        `score_threshold` and calculates the recall at each IOU threshold in `iou_thresholds`.
        The final AR value is the average of these recall values across all specified IOU
        thresholds.

        Parameters
        ----------
        value : float
            The average recall value averaged over the specified IOU thresholds.
        score_threshold : float
            The detection score threshold; only detections with confidence scores above this
            threshold are considered.
        iou_thresholds : list[float]
            The list of IOU thresholds used to compute the recall values.
        label : str
            The class label for which the AR is computed.

        Returns
        -------
        Metric
        """
        return cls(
            type=MetricType.AR.value,
            value=value,
            parameters={
                "iou_thresholds": iou_thresholds,
                "score_threshold": score_threshold,
                "label": label,
            },
        )

    @classmethod
    def mean_average_recall(
        cls,
        value: float,
        score_threshold: float,
        iou_thresholds: list[float],
    ):
        """
        Mean Average Recall (mAR) metric for object detection tasks.

        The mAR computation considers detections with confidence scores above the specified
        `score_threshold` and calculates recall at each IOU threshold in `iou_thresholds` for
        each label. The final mAR value is obtained by averaging these recall values over the
        specified IOU thresholds and then averaging across all labels.

        Parameters
        ----------
        value : float
            The mean average recall value averaged over the specified IOU thresholds.
        score_threshold : float
            The detection score threshold; only detections with confidence scores above this
            threshold are considered.
        iou_thresholds : list[float]
            The list of IOU thresholds used to compute the recall values.

        Returns
        -------
        Metric
        """
        return cls(
            type=MetricType.mAR.value,
            value=value,
            parameters={
                "iou_thresholds": iou_thresholds,
                "score_threshold": score_threshold,
            },
        )

    @classmethod
    def average_recall_averaged_over_scores(
        cls,
        value: float,
        score_thresholds: list[float],
        iou_thresholds: list[float],
        label: str,
    ):
        """
        Average Recall (AR) metric averaged over multiple score thresholds for a specific object class label.

        The AR computation considers detections across multiple `score_thresholds` and calculates
        recall at each IOU threshold in `iou_thresholds`. The final AR value is obtained by averaging
        the recall values over all specified score thresholds and IOU thresholds.

        Parameters
        ----------
        value : float
            The average recall value averaged over the specified score thresholds and IOU thresholds.
        score_thresholds : list[float]
            The list of detection score thresholds; detections with confidence scores above each threshold are considered.
        iou_thresholds : list[float]
            The list of IOU thresholds used to compute the recall values.
        label : str
            The class label for which the AR is computed.

        Returns
        -------
        Metric
        """
        return cls(
            type=MetricType.ARAveragedOverScores.value,
            value=value,
            parameters={
                "iou_thresholds": iou_thresholds,
                "score_thresholds": score_thresholds,
                "label": label,
            },
        )

    @classmethod
    def mean_average_recall_averaged_over_scores(
        cls,
        value: float,
        score_thresholds: list[float],
        iou_thresholds: list[float],
    ):
        """
        Mean Average Recall (mAR) metric averaged over multiple score thresholds and IOU thresholds.

        The mAR computation considers detections across multiple `score_thresholds`, calculates recall
        at each IOU threshold in `iou_thresholds` for each label, averages these recall values over all
        specified score thresholds and IOU thresholds, and then computes the mean across all labels to
        obtain the final mAR value.

        Parameters
        ----------
        value : float
            The mean average recall value averaged over the specified score thresholds and IOU thresholds.
        score_thresholds : list[float]
            The list of detection score thresholds; detections with confidence scores above each threshold are considered.
        iou_thresholds : list[float]
            The list of IOU thresholds used to compute the recall values.

        Returns
        -------
        Metric
        """
        return cls(
            type=MetricType.mARAveragedOverScores.value,
            value=value,
            parameters={
                "iou_thresholds": iou_thresholds,
                "score_thresholds": score_thresholds,
            },
        )

    @classmethod
    def precision_recall_curve(
        cls,
        precisions: list[float],
        scores: list[float],
        iou_threshold: float,
        label: str,
    ):
        """
        Interpolated precision-recall curve over 101 recall points.

        The precision values are interpolated over recalls ranging from 0.0 to 1.0 in steps of 0.01,
        resulting in 101 points. This is a byproduct of the 101-point interpolation used in calculating
        the Average Precision (AP) metric in object detection tasks.

        Parameters
        ----------
        precisions : list[float]
            Interpolated precision values corresponding to recalls at 0.0, 0.01, ..., 1.0.
        scores : list[float]
            Maximum prediction score for each point on the interpolated curve.
        iou_threshold : float
            The Intersection over Union (IOU) threshold used to determine true positives.
        label : str
            The class label associated with this precision-recall curve.

        Returns
        -------
        Metric
            A metric whose value is a dictionary with the keys `precisions` and `scores`.
        """
        return cls(
            type=MetricType.PrecisionRecallCurve.value,
            value={
                "precisions": precisions,
                "scores": scores,
            },
            parameters={
                "iou_threshold": iou_threshold,
                "label": label,
            },
        )

    @classmethod
    def counts(
        cls,
        tp: int,
        fp: int,
        fn: int,
        label: str,
        iou_threshold: float,
        score_threshold: float,
    ):
        """
        Counts metric for a specific class label in object detection.

        The returned metric encapsulates the counts of true positives (`tp`), false positives (`fp`),
        and false negatives (`fn`) for object detection evaluation, along with the associated
        class label, Intersection over Union (IOU) threshold, and confidence score threshold.

        Parameters
        ----------
        tp : int
            Number of true positives.
        fp : int
            Number of false positives.
        fn : int
            Number of false negatives.
        label : str
            The class label for which the counts are calculated.
        iou_threshold : float
            The IOU threshold used to determine a match between predicted and ground truth boxes.
        score_threshold : float
            The confidence score threshold above which predictions are considered.

        Returns
        -------
        Metric
            A metric whose value is a dictionary with the keys `tp`, `fp` and `fn`.
        """
        return cls(
            type=MetricType.Counts.value,
            value={
                "tp": tp,
                "fp": fp,
                "fn": fn,
            },
            parameters={
                "iou_threshold": iou_threshold,
                "score_threshold": score_threshold,
                "label": label,
            },
        )

    @classmethod
    def confusion_matrix(
        cls,
        confusion_matrix: dict[
            str,  # ground truth label value
            dict[
                str,  # prediction label value
                dict[
                    str,  # either `count` or `examples`
                    int
                    | list[
                        dict[
                            str,  # either `datum_id`, `ground_truth_id`, `prediction_id`
                            str,  # string identifier
                        ]
                    ],
                ],
            ],
        ],
        unmatched_predictions: dict[
            str,  # prediction label value
            dict[
                str,  # either `count` or `examples`
                int
                | list[
                    dict[
                        str,  # either `datum_id` or `prediction_id`
                        str,  # string identifier
                    ]
                ],
            ],
        ],
        unmatched_ground_truths: dict[
            str,  # ground truth label value
            dict[
                str,  # either `count` or `examples`
                int
                | list[
                    dict[
                        str,  # either `datum_id` or `ground_truth_id`
                        str,  # string identifier
                    ]
                ],
            ],
        ],
        score_threshold: float,
        iou_threshold: float,
    ):
        """
        Confusion matrix for object detection tasks.

        The returned metric encapsulates detailed information about the model's performance, including
        correct predictions, misclassifications, unmatched predictions (subset of false positives), and
        unmatched ground truths (subset of false negatives). It provides counts and examples for each
        category to facilitate in-depth analysis.

        Confusion Matrix Format:
        {
            <ground truth label>: {
                <prediction label>: {
                    'count': int,
                    'examples': [
                        {
                            'datum_id': str,
                            'ground_truth_id': str,
                            'prediction_id': str
                        },
                        ...
                    ],
                },
                ...
            },
            ...
        }

        Unmatched Predictions Format:
        {
            <prediction label>: {
                'count': int,
                'examples': [
                    {
                        'datum_id': str,
                        'prediction_id': str
                    },
                    ...
                ],
            },
            ...
        }

        Unmatched Ground Truths Format:
        {
            <ground truth label>: {
                'count': int,
                'examples': [
                    {
                        'datum_id': str,
                        'ground_truth_id': str
                    },
                    ...
                ],
            },
            ...
        }

        Parameters
        ----------
        confusion_matrix : dict
            A nested dictionary where the first key is the ground truth label value, the second key
            is the prediction label value, and the innermost dictionary contains either a `count`
            or a list of `examples`. Each example includes annotation and datum identifiers.
        unmatched_predictions : dict
            A dictionary where each key is a prediction label value with no corresponding ground truth
            (subset of false positives). The value is a dictionary containing either a `count` or a list of
            `examples`. Each example includes annotation and datum identifiers.
        unmatched_ground_truths : dict
            A dictionary where each key is a ground truth label value for which the model failed to predict
            (subset of false negatives). The value is a dictionary containing either a `count` or a list of `examples`.
            Each example includes annotation and datum identifiers.
        score_threshold : float
            The confidence score threshold used to filter predictions.
        iou_threshold : float
            The Intersection over Union (IOU) threshold used to determine true positives.

        Returns
        -------
        Metric
            A metric whose value is a dictionary with the keys `confusion_matrix`,
            `unmatched_predictions` and `unmatched_ground_truths`.
        """
        # NOTE(review): the docstring spells the example key `ground_truth_id` to agree
        # with the signature comments; it previously read `groundtruth_id`. Confirm the
        # spelling against the code that builds these dictionaries.
        # The inputs are stored as passed; nothing here validates their nested structure.
        return cls(
            type=MetricType.ConfusionMatrix.value,
            value={
                "confusion_matrix": confusion_matrix,
                "unmatched_predictions": unmatched_predictions,
                "unmatched_ground_truths": unmatched_ground_truths,
            },
            parameters={
                "score_threshold": score_threshold,
                "iou_threshold": iou_threshold,
            },
        )

`average_precision(value, iou_threshold, label)` `classmethod`

Average Precision (AP) metric for object detection tasks.

The AP computation uses 101-point interpolation, which calculates the average precision by interpolating the precision-recall curve at 101 evenly spaced recall levels from 0 to 1.

Parameters:

Name	Type	Description	Default
`value`	`float`	The average precision value.	required
`iou_threshold`	`float`	The IOU threshold used to compute the AP.	required
`label`	`str`	The class label for which the AP is computed.	required

Returns:

Type	Description
`Metric`

Source code in valor_lite/object_detection/metric.py

@classmethod
def average_precision(
    cls,
    value: float,
    iou_threshold: float,
    label: str,
):
    """
    Create an Average Precision (AP) metric for object detection tasks.

    AP is computed with 101-point interpolation: the precision-recall curve is
    interpolated at 101 evenly spaced recall levels from 0 to 1 to obtain the
    average precision.

    Parameters
    ----------
    value : float
        The average precision value.
    iou_threshold : float
        The IOU threshold used to compute the AP.
    label : str
        The class label for which the AP is computed.

    Returns
    -------
    Metric
    """
    # Key order is kept as-is so the parameter dictionary iterates identically.
    metric_parameters = {
        "iou_threshold": iou_threshold,
        "label": label,
    }
    return cls(
        type=MetricType.AP.value,
        value=value,
        parameters=metric_parameters,
    )

`average_precision_averaged_over_IOUs(value, iou_thresholds, label)` `classmethod`

Average Precision (AP) metric averaged over multiple IOU thresholds.

The AP computation uses 101-point interpolation, which calculates the average precision by interpolating the precision-recall curve at 101 evenly spaced recall levels from 0 to 1 for each IOU threshold specified in iou_thresholds. The final APAveragedOverIOUs value is obtained by averaging these AP values across all specified IOU thresholds.

Parameters:

Name	Type	Description	Default
`value`	`float`	The average precision value averaged over the specified IOU thresholds.	required
`iou_thresholds`	`list[float]`	The list of IOU thresholds used to compute the AP values.	required
`label`	`str`	The class label for which the AP is computed.	required

Returns:

Type	Description
`Metric`

Source code in valor_lite/object_detection/metric.py

@classmethod
def average_precision_averaged_over_IOUs(
    cls,
    value: float,
    iou_thresholds: list[float],
    label: str,
):
    """
    Create an Average Precision (AP) metric averaged over multiple IOU thresholds.

    For each IOU threshold in `iou_thresholds`, AP is computed with 101-point
    interpolation (the precision-recall curve interpolated at 101 evenly spaced
    recall levels from 0 to 1). The APAveragedOverIOUs value is the average of
    those AP values across all specified IOU thresholds.

    Parameters
    ----------
    value : float
        The average precision value averaged over the specified IOU thresholds.
    iou_thresholds : list[float]
        The list of IOU thresholds used to compute the AP values.
    label : str
        The class label for which the AP is computed.

    Returns
    -------
    Metric
    """
    # Key order is kept as-is so the parameter dictionary iterates identically.
    metric_parameters = {
        "iou_thresholds": iou_thresholds,
        "label": label,
    }
    return cls(
        type=MetricType.APAveragedOverIOUs.value,
        value=value,
        parameters=metric_parameters,
    )

`average_recall(value, score_threshold, iou_thresholds, label)` `classmethod`

Average Recall (AR) metric for object detection tasks.

The AR computation considers detections with confidence scores above the specified score_threshold and calculates the recall at each IOU threshold in iou_thresholds. The final AR value is the average of these recall values across all specified IOU thresholds.

Parameters:

Name	Type	Description	Default
`value`	`float`	The average recall value averaged over the specified IOU thresholds.	required
`score_threshold`	`float`	The detection score threshold; only detections with confidence scores above this threshold are considered.	required
`iou_thresholds`	`list[float]`	The list of IOU thresholds used to compute the recall values.	required
`label`	`str`	The class label for which the AR is computed.	required

Returns:

Type	Description
`Metric`

Source code in valor_lite/object_detection/metric.py

@classmethod
def average_recall(
    cls,
    value: float,
    score_threshold: float,
    iou_thresholds: list[float],
    label: str,
):
    """
    Create an Average Recall (AR) metric for object detection tasks.

    Only detections with confidence scores above `score_threshold` are
    considered. Recall is calculated at each IOU threshold in `iou_thresholds`,
    and the AR value is the average of those recall values.

    Parameters
    ----------
    value : float
        The average recall value averaged over the specified IOU thresholds.
    score_threshold : float
        The detection score threshold; only detections with confidence scores above this
        threshold are considered.
    iou_thresholds : list[float]
        The list of IOU thresholds used to compute the recall values.
    label : str
        The class label for which the AR is computed.

    Returns
    -------
    Metric
    """
    # Key order is kept as-is so the parameter dictionary iterates identically.
    metric_parameters = {
        "iou_thresholds": iou_thresholds,
        "score_threshold": score_threshold,
        "label": label,
    }
    return cls(
        type=MetricType.AR.value,
        value=value,
        parameters=metric_parameters,
    )

`average_recall_averaged_over_scores(value, score_thresholds, iou_thresholds, label)` `classmethod`

Average Recall (AR) metric averaged over multiple score thresholds for a specific object class label.

The AR computation considers detections across multiple score_thresholds and calculates recall at each IOU threshold in iou_thresholds. The final AR value is obtained by averaging the recall values over all specified score thresholds and IOU thresholds.

Parameters:

Name	Type	Description	Default
`value`	`float`	The average recall value averaged over the specified score thresholds and IOU thresholds.	required
`score_thresholds`	`list[float]`	The list of detection score thresholds; detections with confidence scores above each threshold are considered.	required
`iou_thresholds`	`list[float]`	The list of IOU thresholds used to compute the recall values.	required
`label`	`str`	The class label for which the AR is computed.	required

Returns:

Type	Description
`Metric`

Source code in valor_lite/object_detection/metric.py

@classmethod
def average_recall_averaged_over_scores(
    cls,
    value: float,
    score_thresholds: list[float],
    iou_thresholds: list[float],
    label: str,
):
    """
    Create an Average Recall (AR) metric averaged over multiple score thresholds for one class label.

    Detections are considered across every threshold in `score_thresholds`, and
    recall is calculated at each IOU threshold in `iou_thresholds`. The AR value
    is the average of the recall values over all specified score thresholds and
    IOU thresholds.

    Parameters
    ----------
    value : float
        The average recall value averaged over the specified score thresholds and IOU thresholds.
    score_thresholds : list[float]
        The list of detection score thresholds; detections with confidence scores above each threshold are considered.
    iou_thresholds : list[float]
        The list of IOU thresholds used to compute the recall values.
    label : str
        The class label for which the AR is computed.

    Returns
    -------
    Metric
    """
    # Key order is kept as-is so the parameter dictionary iterates identically.
    metric_parameters = {
        "iou_thresholds": iou_thresholds,
        "score_thresholds": score_thresholds,
        "label": label,
    }
    return cls(
        type=MetricType.ARAveragedOverScores.value,
        value=value,
        parameters=metric_parameters,
    )

`confusion_matrix(confusion_matrix, unmatched_predictions, unmatched_ground_truths, score_threshold, iou_threshold)` `classmethod`

Confusion matrix for object detection tasks.

This class encapsulates detailed information about the model's performance, including correct predictions, misclassifications, unmatched_predictions (subset of false positives), and unmatched ground truths (subset of false negatives). It provides counts and examples for each category to facilitate in-depth analysis.

Confusion Matrix Format: `{ <ground truth label>: { <prediction label>: { 'count': int, 'examples': [ { 'datum_id': str, 'groundtruth_id': str, 'prediction_id': str }, ... ], }, ... }, ... }`

Unmatched Predictions Format: `{ <prediction label>: { 'count': int, 'examples': [ { 'datum_id': str, 'prediction_id': str }, ... ], }, ... }`

Unmatched Ground Truths Format: `{ <ground truth label>: { 'count': int, 'examples': [ { 'datum_id': str, 'groundtruth_id': str }, ... ], }, ... }`

Parameters:

Name	Type	Description	Default
`confusion_matrix`	`dict`	A nested dictionary where the first key is the ground truth label value, the second key is the prediction label value, and the innermost dictionary contains either a `count` or a list of `examples`. Each example includes annotation and datum identifiers.	required
`unmatched_predictions`	`dict`	A dictionary where each key is a prediction label value with no corresponding ground truth (subset of false positives). The value is a dictionary containing either a `count` or a list of `examples`. Each example includes annotation and datum identifiers.	required
`unmatched_ground_truths`	`dict`	A dictionary where each key is a ground truth label value for which the model failed to predict (subset of false negatives). The value is a dictionary containing either a `count` or a list of `examples`. Each example includes annotation and datum identifiers.	required
`score_threshold`	`float`	The confidence score threshold used to filter predictions.	required
`iou_threshold`	`float`	The Intersection over Union (IOU) threshold used to determine true positives.	required

Returns:

Type	Description
`Metric`

Source code in valor_lite/object_detection/metric.py

@classmethod
def confusion_matrix(
    cls,
    confusion_matrix: dict[
        str,  # ground truth label value
        dict[
            str,  # prediction label value
            dict[
                str,  # either `count` or `examples`
                int
                | list[
                    dict[
                        str,  # either `datum_id`, `ground_truth_id`, `prediction_id`
                        str,  # string identifier
                    ]
                ],
            ],
        ],
    ],
    unmatched_predictions: dict[
        str,  # prediction label value
        dict[
            str,  # either `count` or `examples`
            int
            | list[
                dict[
                    str,  # either `datum_id` or `prediction_id`
                    str,  # string identifier
                ]
            ],
        ],
    ],
    unmatched_ground_truths: dict[
        str,  # ground truth label value
        dict[
            str,  # either `count` or `examples`
            int
            | list[
                dict[
                    str,  # either `datum_id` or `ground_truth_id`
                    str,  # string identifier
                ]
            ],
        ],
    ],
    score_threshold: float,
    iou_threshold: float,
):
    """
    Build a confusion-matrix metric for object detection tasks.

    The metric bundles three views of a model's performance: the matrix of
    correct predictions and misclassifications, the unmatched predictions
    (a subset of false positives), and the unmatched ground truths (a subset
    of false negatives). Each entry carries a count and examples so results
    can be inspected in depth. The three inputs are stored as given; this
    constructor performs no validation or copying of them.

    NOTE(review): the format sketches below spell the ground truth key
    `groundtruth_id`, while the comments in the signature spell it
    `ground_truth_id` -- confirm which one the producer actually emits.

    Confusion Matrix Format:
    {
        <ground truth label>: {
            <prediction label>: {
                'count': int,
                'examples': [
                    {
                        'datum_id': str,
                        'groundtruth_id': str,
                        'prediction_id': str
                    },
                    ...
                ],
            },
            ...
        },
        ...
    }

    Unmatched Predictions Format:
    {
        <prediction label>: {
            'count': int,
            'examples': [
                {
                    'datum_id': str,
                    'prediction_id': str
                },
                ...
            ],
        },
        ...
    }

    Unmatched Ground Truths Format:
    {
        <ground truth label>: {
            'count': int,
            'examples': [
                {
                    'datum_id': str,
                    'groundtruth_id': str
                },
                ...
            ],
        },
        ...
    }

    Parameters
    ----------
    confusion_matrix : dict
        Nested dictionary keyed first by ground truth label value and then by
        prediction label value. The innermost dictionary contains either a
        `count` or a list of `examples`; each example includes annotation and
        datum identifiers.
    unmatched_predictions : dict
        Dictionary keyed by prediction label value for predictions with no
        corresponding ground truth (subset of false positives). Each value is
        a dictionary containing either a `count` or a list of `examples`;
        each example includes annotation and datum identifiers.
    unmatched_ground_truths : dict
        Dictionary keyed by ground truth label value for ground truths the
        model failed to predict (subset of false negatives). Each value is a
        dictionary containing either a `count` or a list of `examples`; each
        example includes annotation and datum identifiers.
    score_threshold : float
        The confidence score threshold used to filter predictions.
    iou_threshold : float
        The Intersection over Union (IOU) threshold used to determine true positives.

    Returns
    -------
    Metric
        A metric of type `MetricType.ConfusionMatrix` whose value holds the
        three dictionaries and whose parameters hold the two thresholds.
    """
    # Key order is part of the emitted structure, so it is kept stable.
    payload = {
        "confusion_matrix": confusion_matrix,
        "unmatched_predictions": unmatched_predictions,
        "unmatched_ground_truths": unmatched_ground_truths,
    }
    thresholds = {
        "score_threshold": score_threshold,
        "iou_threshold": iou_threshold,
    }
    return cls(
        type=MetricType.ConfusionMatrix.value,
        value=payload,
        parameters=thresholds,
    )

`counts(tp, fp, fn, label, iou_threshold, score_threshold)` `classmethod`

Counts encapsulates the counts of true positives (tp), false positives (fp), and false negatives (fn) for object detection evaluation, along with the associated class label, Intersection over Union (IOU) threshold, and confidence score threshold.

Parameters:

Name	Type	Description	Default
`tp`	`int`	Number of true positives.	required
`fp`	`int`	Number of false positives.	required
`fn`	`int`	Number of false negatives.	required
`label`	`str`	The class label for which the counts are calculated.	required
`iou_threshold`	`float`	The IOU threshold used to determine a match between predicted and ground truth boxes.	required
`score_threshold`	`float`	The confidence score threshold above which predictions are considered.	required

Returns:

Type	Description
`Metric`

Source code in valor_lite/object_detection/metric.py

@classmethod
def counts(
    cls,
    tp: int,
    fp: int,
    fn: int,
    label: str,
    iou_threshold: float,
    score_threshold: float,
):
    """
    Build a `Counts` metric for a single class label.

    The metric value groups the true positive (`tp`), false positive (`fp`)
    and false negative (`fn`) tallies; the class label, Intersection over
    Union (IOU) threshold and confidence score threshold are recorded as
    parameters.

    Parameters
    ----------
    tp : int
        Number of true positives.
    fp : int
        Number of false positives.
    fn : int
        Number of false negatives.
    label : str
        The class label for which the counts are calculated.
    iou_threshold : float
        The IOU threshold used to determine a match between predicted and ground truth boxes.
    score_threshold : float
        The confidence score threshold above which predictions are considered.

    Returns
    -------
    Metric
        A metric of type `MetricType.Counts` with a dictionary value keyed by
        `tp`, `fp` and `fn`.
    """
    tallies = {
        "tp": tp,
        "fp": fp,
        "fn": fn,
    }
    # Key order matches the established output layout for this metric.
    settings = {
        "iou_threshold": iou_threshold,
        "score_threshold": score_threshold,
        "label": label,
    }
    return cls(
        type=MetricType.Counts.value,
        value=tallies,
        parameters=settings,
    )

`f1_score(value, label, iou_threshold, score_threshold)` `classmethod`

F1 score for a specific class label in object detection.

This class encapsulates a metric value for a particular class label, along with the associated Intersection over Union (IOU) threshold and confidence score threshold.

Parameters:

Name	Type	Description	Default
`value`	`float`	The metric value.	required
`label`	`str`	The class label for which the metric is calculated.	required
`iou_threshold`	`float`	The IOU threshold used to determine matches between predicted and ground truth boxes.	required
`score_threshold`	`float`	The confidence score threshold above which predictions are considered.	required

Returns:

Type	Description
`Metric`

Source code in valor_lite/object_detection/metric.py

@classmethod
def f1_score(
    cls,
    value: float,
    label: str,
    iou_threshold: float,
    score_threshold: float,
):
    """
    Build an F1 score metric for a specific class label in object detection.

    The supplied value is stored unchanged, tagged with the class label and
    the Intersection over Union (IOU) and confidence score thresholds it was
    computed at.

    Parameters
    ----------
    value : float
        The metric value.
    label : str
        The class label for which the metric is calculated.
    iou_threshold : float
        The IOU threshold used to determine matches between predicted and ground truth boxes.
    score_threshold : float
        The confidence score threshold above which predictions are considered.

    Returns
    -------
    Metric
        A metric of type `MetricType.F1`.
    """
    settings = {
        "label": label,
        "iou_threshold": iou_threshold,
        "score_threshold": score_threshold,
    }
    return cls(type=MetricType.F1.value, value=value, parameters=settings)

`mean_average_precision(value, iou_threshold)` `classmethod`

Mean Average Precision (mAP) metric for object detection tasks.

The AP computation uses 101-point interpolation, which calculates the average precision for each class by interpolating the precision-recall curve at 101 evenly spaced recall levels from 0 to 1. The mAP is then calculated by averaging these values across all class labels.

Parameters:

Name	Type	Description	Default
`value`	`float`	The mean average precision value.	required
`iou_threshold`	`float`	The IOU threshold used to compute the mAP.	required

Returns:

Type	Description
`Metric`

Source code in valor_lite/object_detection/metric.py

@classmethod
def mean_average_precision(
    cls,
    value: float,
    iou_threshold: float,
):
    """
    Build a Mean Average Precision (mAP) metric for object detection tasks.

    This constructor only packages an already-computed value. Per the metric's
    definition, the AP computation uses 101-point interpolation: average
    precision is calculated for each class by interpolating the
    precision-recall curve at 101 evenly spaced recall levels from 0 to 1,
    and mAP is the average of those values across all class labels.

    Parameters
    ----------
    value : float
        The mean average precision value.
    iou_threshold : float
        The IOU threshold used to compute the mAP.

    Returns
    -------
    Metric
        A metric of type `MetricType.mAP`.
    """
    settings = {"iou_threshold": iou_threshold}
    return cls(type=MetricType.mAP.value, value=value, parameters=settings)

`mean_average_precision_averaged_over_IOUs(value, iou_thresholds)` `classmethod`

Mean Average Precision (mAP) metric averaged over multiple IOU thresholds.

The AP computation uses 101-point interpolation, which calculates the average precision by interpolating the precision-recall curve at 101 evenly spaced recall levels from 0 to 1 for each IOU threshold specified in iou_thresholds. The final mAPAveragedOverIOUs value is obtained by averaging these AP values across all specified IOU thresholds and all class labels.

Parameters:

Name	Type	Description	Default
`value`	`float`	The average precision value averaged over the specified IOU thresholds.	required
`iou_thresholds`	`list[float]`	The list of IOU thresholds used to compute the AP values.	required

Returns:

Type	Description
`Metric`

Source code in valor_lite/object_detection/metric.py

@classmethod
def mean_average_precision_averaged_over_IOUs(
    cls,
    value: float,
    iou_thresholds: list[float],
):
    """
    Build a Mean Average Precision (mAP) metric averaged over multiple IOU thresholds.

    This constructor only packages an already-computed value. Per the metric's
    definition, the AP computation uses 101-point interpolation: average
    precision is calculated by interpolating the precision-recall curve at
    101 evenly spaced recall levels from 0 to 1 for each IOU threshold in
    `iou_thresholds`. The final mAPAveragedOverIOUs value is the average of
    those AP values across all specified IOU thresholds and all class labels.

    Parameters
    ----------
    value : float
        The average precision value averaged over the specified IOU thresholds.
    iou_thresholds : list[float]
        The list of IOU thresholds used to compute the AP values.

    Returns
    -------
    Metric
        A metric of type `MetricType.mAPAveragedOverIOUs`.
    """
    settings = {"iou_thresholds": iou_thresholds}
    return cls(
        type=MetricType.mAPAveragedOverIOUs.value,
        value=value,
        parameters=settings,
    )

`mean_average_recall(value, score_threshold, iou_thresholds)` `classmethod`

Mean Average Recall (mAR) metric for object detection tasks.

The mAR computation considers detections with confidence scores above the specified score_threshold and calculates recall at each IOU threshold in iou_thresholds for each label. The final mAR value is obtained by averaging these recall values over the specified IOU thresholds and then averaging across all labels.

Parameters:

Name	Type	Description	Default
`value`	`float`	The mean average recall value averaged over the specified IOU thresholds.	required
`score_threshold`	`float`	The detection score threshold; only detections with confidence scores above this threshold are considered.	required
`iou_thresholds`	`list[float]`	The list of IOU thresholds used to compute the recall values.	required

Returns:

Type	Description
`Metric`

Source code in valor_lite/object_detection/metric.py

@classmethod
def mean_average_recall(
    cls,
    value: float,
    score_threshold: float,
    iou_thresholds: list[float],
):
    """
    Build a Mean Average Recall (mAR) metric for object detection tasks.

    This constructor only packages an already-computed value. Per the metric's
    definition, the mAR computation considers detections with confidence
    scores above `score_threshold` and calculates recall at each IOU
    threshold in `iou_thresholds` for each label. Those recall values are
    averaged over the IOU thresholds and then across all labels.

    Parameters
    ----------
    value : float
        The mean average recall value averaged over the specified IOU thresholds.
    score_threshold : float
        The detection score threshold; only detections with confidence scores above this
        threshold are considered.
    iou_thresholds : list[float]
        The list of IOU thresholds used to compute the recall values.

    Returns
    -------
    Metric
        A metric of type `MetricType.mAR`.
    """
    # Parameters list the IOU thresholds before the score threshold.
    settings = {
        "iou_thresholds": iou_thresholds,
        "score_threshold": score_threshold,
    }
    return cls(type=MetricType.mAR.value, value=value, parameters=settings)

`mean_average_recall_averaged_over_scores(value, score_thresholds, iou_thresholds)` `classmethod`

Mean Average Recall (mAR) metric averaged over multiple score thresholds and IOU thresholds.

The mAR computation considers detections across multiple score_thresholds, calculates recall at each IOU threshold in iou_thresholds for each label, averages these recall values over all specified score thresholds and IOU thresholds, and then computes the mean across all labels to obtain the final mAR value.

Parameters:

Name	Type	Description	Default
`value`	`float`	The mean average recall value averaged over the specified score thresholds and IOU thresholds.	required
`score_thresholds`	`list[float]`	The list of detection score thresholds; detections with confidence scores above each threshold are considered.	required
`iou_thresholds`	`list[float]`	The list of IOU thresholds used to compute the recall values.	required

Returns:

Type	Description
`Metric`

Source code in valor_lite/object_detection/metric.py

@classmethod
def mean_average_recall_averaged_over_scores(
    cls,
    value: float,
    score_thresholds: list[float],
    iou_thresholds: list[float],
):
    """
    Build a Mean Average Recall (mAR) metric averaged over multiple score and IOU thresholds.

    This constructor only packages an already-computed value. Per the metric's
    definition, the mAR computation considers detections across multiple
    `score_thresholds` and calculates recall at each IOU threshold in
    `iou_thresholds` for each label. Those recall values are averaged over
    all specified score thresholds and IOU thresholds, and the mean across
    all labels gives the final mAR value.

    Parameters
    ----------
    value : float
        The mean average recall value averaged over the specified score thresholds and IOU thresholds.
    score_thresholds : list[float]
        The list of detection score thresholds; detections with confidence scores above each threshold are considered.
    iou_thresholds : list[float]
        The list of IOU thresholds used to compute the recall values.

    Returns
    -------
    Metric
        A metric of type `MetricType.mARAveragedOverScores`.
    """
    # Parameters list the IOU thresholds before the score thresholds.
    settings = {
        "iou_thresholds": iou_thresholds,
        "score_thresholds": score_thresholds,
    }
    return cls(
        type=MetricType.mARAveragedOverScores.value,
        value=value,
        parameters=settings,
    )

`precision(value, label, iou_threshold, score_threshold)` `classmethod`

Precision metric for a specific class label in object detection.

This class encapsulates a metric value for a particular class label, along with the associated Intersection over Union (IOU) threshold and confidence score threshold.

Parameters:

Name	Type	Description	Default
`value`	`float`	The metric value.	required
`label`	`str`	The class label for which the metric is calculated.	required
`iou_threshold`	`float`	The IOU threshold used to determine matches between predicted and ground truth boxes.	required
`score_threshold`	`float`	The confidence score threshold above which predictions are considered.	required

Returns:

Type	Description
`Metric`

Source code in valor_lite/object_detection/metric.py

@classmethod
def precision(
    cls,
    value: float,
    label: str,
    iou_threshold: float,
    score_threshold: float,
):
    """
    Build a precision metric for a specific class label in object detection.

    The supplied value is stored unchanged, tagged with the class label and
    the Intersection over Union (IOU) and confidence score thresholds it was
    computed at.

    Parameters
    ----------
    value : float
        The metric value.
    label : str
        The class label for which the metric is calculated.
    iou_threshold : float
        The IOU threshold used to determine matches between predicted and ground truth boxes.
    score_threshold : float
        The confidence score threshold above which predictions are considered.

    Returns
    -------
    Metric
        A metric of type `MetricType.Precision`.
    """
    settings = {
        "label": label,
        "iou_threshold": iou_threshold,
        "score_threshold": score_threshold,
    }
    return cls(
        type=MetricType.Precision.value,
        value=value,
        parameters=settings,
    )

`precision_recall_curve(precisions, scores, iou_threshold, label)` `classmethod`

Interpolated precision-recall curve over 101 recall points.

The precision values are interpolated over recalls ranging from 0.0 to 1.0 in steps of 0.01, resulting in 101 points. This is a byproduct of the 101-point interpolation used in calculating the Average Precision (AP) metric in object detection tasks.

Parameters:

Name	Type	Description	Default
`precisions`	`list[float]`	Interpolated precision values corresponding to recalls at 0.0, 0.01, ..., 1.0.	required
`scores`	`list[float]`	Maximum prediction score for each point on the interpolated curve.	required
`iou_threshold`	`float`	The Intersection over Union (IOU) threshold used to determine true positives.	required
`label`	`str`	The class label associated with this precision-recall curve.	required

Returns:

Type	Description
`Metric`

Source code in valor_lite/object_detection/metric.py

@classmethod
def precision_recall_curve(
    cls,
    precisions: list[float],
    scores: list[float],
    iou_threshold: float,
    label: str,
):
    """
    Build an interpolated precision-recall curve metric over 101 recall points.

    This constructor only packages the supplied lists; it does not check
    their lengths. Per the metric's definition, precision values are
    interpolated over recalls ranging from 0.0 to 1.0 in steps of 0.01,
    giving 101 points. The curve is a byproduct of the 101-point
    interpolation used to calculate the Average Precision (AP) metric in
    object detection tasks.

    Parameters
    ----------
    precisions : list[float]
        Interpolated precision values corresponding to recalls at 0.0, 0.01, ..., 1.0.
    scores : list[float]
        Maximum prediction score for each point on the interpolated curve.
    iou_threshold : float
        The Intersection over Union (IOU) threshold used to determine true positives.
    label : str
        The class label associated with this precision-recall curve.

    Returns
    -------
    Metric
        A metric of type `MetricType.PrecisionRecallCurve` with a dictionary
        value keyed by `precisions` and `scores`.
    """
    curve = {
        "precisions": precisions,
        "scores": scores,
    }
    settings = {
        "iou_threshold": iou_threshold,
        "label": label,
    }
    return cls(
        type=MetricType.PrecisionRecallCurve.value,
        value=curve,
        parameters=settings,
    )

`recall(value, label, iou_threshold, score_threshold)` `classmethod`

Recall metric for a specific class label in object detection.

This class encapsulates a metric value for a particular class label, along with the associated Intersection over Union (IOU) threshold and confidence score threshold.

Parameters:

Name	Type	Description	Default
`value`	`float`	The metric value.	required
`label`	`str`	The class label for which the metric is calculated.	required
`iou_threshold`	`float`	The IOU threshold used to determine matches between predicted and ground truth boxes.	required
`score_threshold`	`float`	The confidence score threshold above which predictions are considered.	required

Returns:

Type	Description
`Metric`

Source code in valor_lite/object_detection/metric.py

@classmethod
def recall(
    cls,
    value: float,
    label: str,
    iou_threshold: float,
    score_threshold: float,
):
    """
    Build a recall metric for a specific class label in object detection.

    The supplied value is stored unchanged, tagged with the class label and
    the Intersection over Union (IOU) and confidence score thresholds it was
    computed at.

    Parameters
    ----------
    value : float
        The metric value.
    label : str
        The class label for which the metric is calculated.
    iou_threshold : float
        The IOU threshold used to determine matches between predicted and ground truth boxes.
    score_threshold : float
        The confidence score threshold above which predictions are considered.

    Returns
    -------
    Metric
        A metric of type `MetricType.Recall`.
    """
    settings = {
        "label": label,
        "iou_threshold": iou_threshold,
        "score_threshold": score_threshold,
    }
    return cls(type=MetricType.Recall.value, value=value, parameters=settings)

Metrics

Metric dataclass

average_precision(value, iou_threshold, label) classmethod

average_precision_averaged_over_IOUs(value, iou_thresholds, label) classmethod

average_recall(value, score_threshold, iou_thresholds, label) classmethod

average_recall_averaged_over_scores(value, score_thresholds, iou_thresholds, label) classmethod

confusion_matrix(confusion_matrix, unmatched_predictions, unmatched_ground_truths, score_threshold, iou_threshold) classmethod

counts(tp, fp, fn, label, iou_threshold, score_threshold) classmethod

f1_score(value, label, iou_threshold, score_threshold) classmethod

mean_average_precision(value, iou_threshold) classmethod

mean_average_precision_averaged_over_IOUs(value, iou_thresholds) classmethod

mean_average_recall(value, score_threshold, iou_thresholds) classmethod

mean_average_recall_averaged_over_scores(value, score_thresholds, iou_thresholds) classmethod

precision(value, label, iou_threshold, score_threshold) classmethod

precision_recall_curve(precisions, scores, iou_threshold, label) classmethod

recall(value, label, iou_threshold, score_threshold) classmethod

References

`Metric` `dataclass`

`average_precision(value, iou_threshold, label)` `classmethod`

`average_precision_averaged_over_IOUs(value, iou_thresholds, label)` `classmethod`

`average_recall(value, score_threshold, iou_thresholds, label)` `classmethod`

`average_recall_averaged_over_scores(value, score_thresholds, iou_thresholds, label)` `classmethod`

`confusion_matrix(confusion_matrix, unmatched_predictions, unmatched_ground_truths, score_threshold, iou_threshold)` `classmethod`

`counts(tp, fp, fn, label, iou_threshold, score_threshold)` `classmethod`

`f1_score(value, label, iou_threshold, score_threshold)` `classmethod`

`mean_average_precision(value, iou_threshold)` `classmethod`

`mean_average_precision_averaged_over_IOUs(value, iou_thresholds)` `classmethod`

`mean_average_recall(value, score_threshold, iou_thresholds)` `classmethod`

`mean_average_recall_averaged_over_scores(value, score_thresholds, iou_thresholds)` `classmethod`

`precision(value, label, iou_threshold, score_threshold)` `classmethod`

`precision_recall_curve(precisions, scores, iou_threshold, label)` `classmethod`

`recall(value, label, iou_threshold, score_threshold)` `classmethod`