Source code for cerebras_pytorch.metrics.fbeta_score

# Copyright 2016-2023 Cerebras Systems
# SPDX-License-Identifier: BSD-3-Clause

"""
F-beta score metric for PyTorch.

The confusion matrix calculation is adapted from:
https://github.com/pytorch/ignite/blob/master/ignite/metrics/confusion_matrix.py
"""
from typing import List, Optional

import torch

import cerebras_pytorch as cstorch
from cerebras_pytorch.metrics.metric import Metric
from cerebras_pytorch.metrics.utils import (
    compute_confusion_matrix,
    compute_mask,
    divide_no_nan,
)


def compute_helper(
    confusion_matrix,
    mask,
    beta: float = 1.0,
    average_type: str = "micro",
) -> float:
    """Helper function to compute fbeta score"""

    # true_pos = torch.diagonal(confusion_matrix).to(dtype=torch.float)
    # TODO: Use diagonal op when support is added (SW-91547)
    wgth_id = torch.eye(
        confusion_matrix.shape[0], device=confusion_matrix.device
    )
    true_pos = (wgth_id * confusion_matrix).sum(axis=-1, dtype=torch.float)
    predicted_per_class = confusion_matrix.sum(dim=0).type(torch.float)
    actual_per_class = confusion_matrix.sum(dim=1).type(torch.float)

    mask = cstorch.make_constant(mask)

    num_labels_to_consider = mask.sum()
    beta = torch.tensor(beta).to(torch.float)

    if average_type == "micro":
        precision = divide_no_nan(
            (true_pos * mask).sum(), (predicted_per_class * mask).sum()
        )
        recall = divide_no_nan(
            (true_pos * mask).sum(), (actual_per_class * mask).sum()
        )
        fbeta = divide_no_nan(
            (1.0 + beta ** 2) * precision * recall,
            (beta ** 2) * precision + recall,
        )
    else:  # "macro"
        precision_per_class = divide_no_nan(true_pos, predicted_per_class)
        recall_per_class = divide_no_nan(true_pos, actual_per_class)
        fbeta_per_class = divide_no_nan(
            (1.0 + beta ** 2) * precision_per_class * recall_per_class,
            (beta ** 2) * precision_per_class + recall_per_class,
        )
        precision = (precision_per_class * mask).sum() / num_labels_to_consider
        recall = (recall_per_class * mask).sum() / num_labels_to_consider
        fbeta = (fbeta_per_class * mask).sum() / num_labels_to_consider

    return fbeta
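
# Illustrative worked example (added for clarity; not part of the original
# module). For a 2-class confusion matrix [[2, 1], [0, 3]], no ignored labels
# (mask = [1, 1]) and beta = 1, the quantities above become:
#   true_pos            = [2, 3]
#   predicted_per_class = [2, 4]   (column sums)
#   actual_per_class    = [3, 3]   (row sums)
# average_type="micro": precision = 5/6, recall = 5/6, fbeta = 5/6 ≈ 0.833
# average_type="macro": precision_per_class = [1.0, 0.75],
#   recall_per_class = [2/3, 1.0], fbeta_per_class = [0.8, 6/7],
#   fbeta = (0.8 + 6/7) / 2 ≈ 0.829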


class FBetaScoreMetric(Metric):
    """Calculates the F-beta score from labels and predictions.

    fbeta = (1 + beta^2) * (precision * recall) / ((beta^2 * precision) + recall)

    where beta is some positive real factor.

    Args:
        num_classes: Number of classes.
        beta: Beta coefficient in the F measure.
        average_type: Defines the reduction that is applied. Should be one
            of the following:

            - 'micro' [default]: Calculate the metric globally, across all
              samples and classes.
            - 'macro': Calculate the metric for each class separately, and
              average the metrics across classes (with equal weights for
              each class). This does not take label imbalance into account.

        ignore_labels: List of integers specifying the target classes to
            ignore.
        name: Name of the metric.
    """

    def __init__(
        self,
        num_classes,
        beta: float = 1.0,
        average_type: str = "micro",
        ignore_labels: Optional[List] = None,
        name: Optional[str] = None,
    ):
        if num_classes <= 1:
            raise ValueError(
                f"'num_classes' should be at least 2, got {num_classes}"
            )
        self.num_classes = num_classes

        with torch.device("cpu"):
            # We want the mask to be computed on the CPU so that it can be
            # encoded into the graph as a constant
            self.mask = compute_mask(num_classes, ignore_labels)

        super().__init__(name=name)

        if beta <= 0:
            raise ValueError(f"'beta' should be a positive number, got {beta}")
        self.beta = beta

        allowed_average = ["micro", "macro"]
        if average_type not in allowed_average:
            raise ValueError(
                f"The average_type has to be one of {allowed_average}, "
                f"got {average_type}."
            )
        self.average_type = average_type

    def reset(self):
        self.register_state(
            "confusion_matrix",
            torch.zeros(
                (self.num_classes, self.num_classes), dtype=torch.float
            ),
        )
        self._dtype = None

    def update(self, labels, predictions, dtype=None):
        if labels.shape != predictions.shape:
            raise ValueError(
                f"`labels` and `predictions` have mismatched shapes. "
                f"Their shapes were {labels.shape} and {predictions.shape} respectively."
            )

        confusion_matrix = compute_confusion_matrix(
            labels=labels,
            predictions=predictions,
            num_classes=self.num_classes,
            on_device=cstorch.use_cs(),
        )
        self.confusion_matrix.add_(confusion_matrix)

        self._dtype = dtype

    def compute(self) -> torch.Tensor:
        fbeta = compute_helper(
            self.confusion_matrix,
            self.mask,
            beta=self.beta,
            average_type=self.average_type,
        )
        if self._dtype is not None:
            fbeta = fbeta.to(self._dtype)
        return fbeta
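
# A minimal usage sketch (illustrative only; not part of the original module).
# It assumes the metric can be driven eagerly, e.g. on CPU; on a Cerebras
# system the update/compute calls would normally run inside a
# cstorch-compiled step function, and a backend may need to be initialized
# first. The label/prediction tensors below are made-up values.
if __name__ == "__main__":
    metric = FBetaScoreMetric(
        num_classes=3, beta=1.0, average_type="macro", name="fbeta"
    )
    # Accumulate one batch of (made-up) class labels and predicted classes.
    metric.update(
        labels=torch.tensor([0, 1, 2, 2]),
        predictions=torch.tensor([0, 2, 2, 2]),
    )
    # Reduce the accumulated confusion matrix to a macro-averaged F1 score.
    print(float(metric.compute()))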