Source code for xcolumns.confusion_matrix

from typing import Optional, Union

import numpy as np
from scipy.sparse import csr_matrix

from .numba_csr_functions import *
from .types import *
from .utils import *


########################################################################################
# Confusion matrix class
########################################################################################



[docs]
class ConfusionMatrix:
    """
    Class representing a confusion matrix,
    containing counts or ratios of true positives, false positives, false negatives, and true negatives.
    Implements basic operations for confusion matrices such as comparison, addition, subtraction, multiplication, and division.

    Additionally, it can be unpacked into a tuple of counts or ratios (tp, fp, fn, tn) (in this order).
    So it can be used with metric functions that expect tp, fp, fn, and tn as separate arguments.

    Args:
        tp: True positives, a single number or a dense vector/matrix.
        fp: False positives, a single number or a dense vector/matrix.
        fn: False negatives, a single number or a dense vector/matrix.
        tn: True negatives, a single number or a dense vector/matrix.

    The values are stored as given (no copy is made), and the in-place
    operators (``+=``, ``-=``, ``*=``, ``/=``, ``//=``) are applied directly to
    the stored values.
    """

    # Instances define value-based __eq__ and are mutable, so they must not be
    # hashable. Python already implies this when __eq__ is defined; it is
    # spelled out here to make the contract explicit.
    __hash__ = None

    def __init__(
        self,
        tp: Union[Number, DenseMatrix],
        fp: Union[Number, DenseMatrix],
        fn: Union[Number, DenseMatrix],
        tn: Union[Number, DenseMatrix],
    ):
        self.tp = tp
        self.fp = fp
        self.fn = fn
        self.tn = tn

    def __repr__(self) -> str:
        return (
            f"{type(self).__name__}(tp={self.tp!r}, fp={self.fp!r}, "
            f"fn={self.fn!r}, tn={self.tn!r})"
        )

    # For compatibility with methods that expect a tuple
    def __iter__(self):
        yield self.tp
        yield self.fp
        yield self.fn
        yield self.tn

    @staticmethod
    def _entries_equal(left, right) -> bool:
        """Return True if two entries (scalars or dense arrays) compare equal everywhere."""
        try:
            result = left == right
        except (ValueError, RuntimeError):
            # NumPy (>= 1.25) raises ValueError when the shapes cannot be
            # broadcast; presumably torch raises RuntimeError in the same
            # situation. Entries with incompatible shapes are simply not equal.
            return False

        if isinstance(result, bool):
            return result

        # Element-wise comparison result (ndarray, NumPy scalar, tensor, ...):
        # collapse it to a single plain bool.
        reduce_all = getattr(result, "all", None)
        if callable(reduce_all):
            return bool(reduce_all())
        return bool(result)

    def __eq__(self, other: object) -> bool:
        """
        Compare all four entries with ``other``.

        Returns:
            False if ``other`` is not a ConfusionMatrix, otherwise True only if
            tp, fp, fn, and tn all compare equal (element-wise for arrays,
            with the usual broadcasting of ``==``). Always a plain ``bool``.
        """
        if not isinstance(other, ConfusionMatrix):
            return False

        # Each entry is compared on its own, so scalar and array entries can be
        # mixed on either side without raising.
        return all(
            self._entries_equal(mine, theirs) for mine, theirs in zip(self, other)
        )

    def __add__(self, other: "ConfusionMatrix") -> "ConfusionMatrix":
        return ConfusionMatrix(
            self.tp + other.tp,
            self.fp + other.fp,
            self.fn + other.fn,
            self.tn + other.tn,
        )

    def __iadd__(self, other: "ConfusionMatrix") -> "ConfusionMatrix":
        self.tp += other.tp
        self.fp += other.fp
        self.fn += other.fn
        self.tn += other.tn
        return self

    def __sub__(self, other: "ConfusionMatrix") -> "ConfusionMatrix":
        return ConfusionMatrix(
            self.tp - other.tp,
            self.fp - other.fp,
            self.fn - other.fn,
            self.tn - other.tn,
        )

    def __isub__(self, other: "ConfusionMatrix") -> "ConfusionMatrix":
        self.tp -= other.tp
        self.fp -= other.fp
        self.fn -= other.fn
        self.tn -= other.tn
        return self

    def __mul__(self, other: Union[Number, DenseMatrix]) -> "ConfusionMatrix":
        return ConfusionMatrix(
            self.tp * other,
            self.fp * other,
            self.fn * other,
            self.tn * other,
        )

    def __imul__(self, other: Union[Number, DenseMatrix]) -> "ConfusionMatrix":
        self.tp *= other
        self.fp *= other
        self.fn *= other
        self.tn *= other
        return self

    def __truediv__(self, other: Union[Number, DenseMatrix]) -> "ConfusionMatrix":
        return ConfusionMatrix(
            self.tp / other,
            self.fp / other,
            self.fn / other,
            self.tn / other,
        )

    def __itruediv__(self, other: Union[Number, DenseMatrix]) -> "ConfusionMatrix":
        self.tp /= other
        self.fp /= other
        self.fn /= other
        self.tn /= other
        return self

    def __floordiv__(self, other: Union[Number, DenseMatrix]) -> "ConfusionMatrix":
        return ConfusionMatrix(
            self.tp // other,
            self.fp // other,
            self.fn // other,
            self.tn // other,
        )

    def __ifloordiv__(self, other: Union[Number, DenseMatrix]) -> "ConfusionMatrix":
        self.tp //= other
        self.fp //= other
        self.fn //= other
        self.tn //= other
        return self

    def normalize(self) -> "ConfusionMatrix":
        """
        Normalize the confusion matrix, resulting in rates instead of counts.

        Every entry is divided by ``tp + fp + fn + tn``. The instance itself is
        not modified. There is no guard against a zero sum.

        Returns:
            The normalized confusion matrix (a new instance).
        """
        entries_sum = self.tp + self.fp + self.fn + self.tn
        return ConfusionMatrix(
            self.tp / entries_sum,
            self.fp / entries_sum,
            self.fn / entries_sum,
            self.tn / entries_sum,
        )




########################################################################################
# Functions to calculate/update confusion matrix
########################################################################################


def _calculate_tp_dense(
    y_true: DenseMatrix,
    y_pred: DenseMatrix,
    axis: int = 0,
    dtype: Optional[DType] = None,
) -> DenseMatrix:
    return np.sum(y_true * y_pred, axis=axis, dtype=dtype)


# Alternative version, performance is similar
# def _calculate_tp_csr(y_true: csr_matrix, y_pred: csr_matrix, axis=0) -> np.ndarray:
#     return (y_pred.multiply(y_true)).sum(axis=axis)


def _calculate_tp_csr(
    y_true: csr_matrix, y_pred: csr_matrix, axis: int = 0, dtype: Optional[DType] = None
) -> np.ndarray:
    """
    CSR counterpart of the dense true-positive computation.

    Delegates to ``numba_calculate_sum_csr_mat_mul_mat`` with the unpacked CSR
    arrays of ``y_pred`` and ``y_true`` (in this order) and the shape of
    ``y_true``; presumably this sums the element-wise product along ``axis``.

    Args:
        y_true: The true labels.
        y_pred: The predicted labels.
        axis: The axis along which to sum.
        dtype: The data type of the output, if None, the dtype of y_true.
    """
    n, m = y_true.shape
    # Compare against None explicitly: bool(np.dtype(...)) is False for plain
    # (unstructured) dtypes, so a truthiness test would silently ignore an
    # explicitly requested np.dtype instance.
    out_dtype = dtype if dtype is not None else y_true.dtype
    return numba_calculate_sum_csr_mat_mul_mat(
        *unpack_csr_matrices(y_pred, y_true),
        n,
        m,
        axis=axis,
        dtype=out_dtype,
    )


def _calculate_fp_dense(
    y_true: DenseMatrix,
    y_pred: DenseMatrix,
    axis: int = 0,
    dtype: Optional[DType] = None,
) -> DenseMatrix:
    return np.sum((1 - y_true) * y_pred, axis=axis, dtype=dtype)


def _calculate_fn_dense(
    y_true: DenseMatrix,
    y_pred: DenseMatrix,
    axis: int = 0,
    dtype: Optional[DType] = None,
) -> DenseMatrix:
    return np.sum(y_true * (1 - y_pred), axis=axis, dtype=dtype)


def _calculate_fp_csr(
    y_true: csr_matrix, y_pred: csr_matrix, axis: int = 0, dtype: Optional[DType] = None
) -> np.ndarray:
    """
    CSR counterpart of the dense false-positive computation.

    Delegates to ``numba_calculate_sum_csr_mat_mul_ones_minus_mat`` with the
    unpacked CSR arrays of ``y_pred`` and ``y_true`` (in this order);
    presumably this sums ``y_pred * (1 - y_true)`` along ``axis``.

    Args:
        y_true: The true labels.
        y_pred: The predicted labels.
        axis: The axis along which to sum.
        dtype: The data type of the output, if None, the dtype of y_true.
    """
    n, m = y_true.shape
    # Compare against None explicitly: bool(np.dtype(...)) is False for plain
    # (unstructured) dtypes, so a truthiness test would silently ignore an
    # explicitly requested np.dtype instance.
    out_dtype = dtype if dtype is not None else y_true.dtype
    return numba_calculate_sum_csr_mat_mul_ones_minus_mat(
        *unpack_csr_matrices(y_pred, y_true),
        n,
        m,
        axis=axis,
        dtype=out_dtype,
    )


def _calculate_fn_csr(
    y_true: csr_matrix, y_pred: csr_matrix, axis: int = 0, dtype: Optional[DType] = None
) -> np.ndarray:
    """
    CSR counterpart of the dense false-negative computation.

    Delegates to ``numba_calculate_sum_csr_mat_mul_ones_minus_mat`` with the
    unpacked CSR arrays of ``y_true`` and ``y_pred`` (in this order);
    presumably this sums ``y_true * (1 - y_pred)`` along ``axis``.

    Args:
        y_true: The true labels.
        y_pred: The predicted labels.
        axis: The axis along which to sum.
        dtype: The data type of the output, if None, the dtype of y_true.
    """
    n, m = y_true.shape
    # Compare against None explicitly: bool(np.dtype(...)) is False for plain
    # (unstructured) dtypes, so a truthiness test would silently ignore an
    # explicitly requested np.dtype instance.
    out_dtype = dtype if dtype is not None else y_true.dtype
    return numba_calculate_sum_csr_mat_mul_ones_minus_mat(
        *unpack_csr_matrices(y_true, y_pred),
        n,
        m,
        axis=axis,
        dtype=out_dtype,
    )


def _calculate_tn_dense(
    y_true: np.ndarray, y_pred: np.ndarray, axis: int = 0, dtype: Optional[DType] = None
) -> np.ndarray:
    return np.sum((1 - y_true) * (1 - y_pred), axis=axis, dtype=dtype)


def _calculate_conf_mat_entry(
    y_true: Matrix,
    y_pred: Matrix,
    func_for_dense: Callable,
    func_for_csr: Callable,
    normalize: bool = False,
    axis: Optional[int] = 0,
    dtype: Optional[DType] = None,
) -> DenseMatrix:
    """ """

    if isinstance(y_true, DenseMatrix) and isinstance(y_pred, DenseMatrix):
        func = func_for_dense
    elif isinstance(y_true, csr_matrix) and isinstance(y_pred, csr_matrix):
        func = func_for_csr
    else:
        raise ValueError(
            "y_true and y_pred must be both np.ndarray, both torch.Tensor, or csr_matrix"
        )

    if y_true.shape != y_pred.shape:
        raise ValueError("y_true and y_pred must have the same shape")

    if axis not in (0, 1):
        raise ValueError("axis must be 0 or 1")

    val = func(y_true, y_pred, axis=axis, dtype=dtype)

    if normalize:
        val = val / y_true.shape[0]

    return val



[docs]
def calculate_tp(
    y_true: Matrix,
    y_pred: Matrix,
    normalize: bool = False,
    axis: Optional[int] = 0,
    dtype: Optional[DType] = None,
) -> Union[Number, DenseMatrix]:
    """
    Calculate the number of true positives for the given true and predicted labels along an axis.

    Args:
        y_true: The true labels.
        y_pred: The predicted labels.
        normalize: Whether to normalize the result, resulting in rates instead of counts.
        axis: The axis along which to calculate the true positives, must be 0 or 1.
        dtype: The data type of the output. If None, it is chosen by the underlying
            implementation (for CSR inputs, the dtype of y_true).

    Returns:
        The number or vector of true positive counts or rates.

    Raises:
        ValueError: If the inputs are not both dense or both CSR matrices,
            if their shapes differ, or if axis is neither 0 nor 1.
    """
    return _calculate_conf_mat_entry(
        y_true,
        y_pred,
        func_for_dense=_calculate_tp_dense,
        func_for_csr=_calculate_tp_csr,
        normalize=normalize,
        axis=axis,
        dtype=dtype,
    )




[docs]
def calculate_fp(
    y_true: Matrix,
    y_pred: Matrix,
    normalize: bool = False,
    axis: Optional[int] = 0,
    dtype: Optional[DType] = None,
) -> Union[Number, DenseMatrix]:
    """
    Calculate the number of false positives for the given true and predicted labels along an axis.

    Args:
        y_true: The true labels.
        y_pred: The predicted labels.
        normalize: Whether to normalize the result, resulting in rates instead of counts.
        axis: The axis along which to calculate the false positives, must be 0 or 1.
        dtype: The data type of the output. If None, it is chosen by the underlying
            implementation (for CSR inputs, the dtype of y_true).

    Returns:
        The number or vector of false positive counts or rates.

    Raises:
        ValueError: If the inputs are not both dense or both CSR matrices,
            if their shapes differ, or if axis is neither 0 nor 1.
    """
    return _calculate_conf_mat_entry(
        y_true,
        y_pred,
        func_for_dense=_calculate_fp_dense,
        func_for_csr=_calculate_fp_csr,
        normalize=normalize,
        axis=axis,
        dtype=dtype,
    )




[docs]
def calculate_fn(
    y_true: Matrix,
    y_pred: Matrix,
    normalize: bool = False,
    axis: Optional[int] = 0,
    dtype: Optional[DType] = None,
) -> Union[Number, DenseMatrix]:
    """
    Calculate the number of false negatives for the given true and predicted labels along an axis.

    Args:
        y_true: The true labels.
        y_pred: The predicted labels.
        normalize: Whether to normalize the result, resulting in rates instead of counts.
        axis: The axis along which to calculate the false negatives, must be 0 or 1.
        dtype: The data type of the output. If None, it is chosen by the underlying
            implementation (for CSR inputs, the dtype of y_true).

    Returns:
        The number or vector of false negative counts or rates.

    Raises:
        ValueError: If the inputs are not both dense or both CSR matrices,
            if their shapes differ, or if axis is neither 0 nor 1.
    """
    return _calculate_conf_mat_entry(
        y_true,
        y_pred,
        func_for_dense=_calculate_fn_dense,
        func_for_csr=_calculate_fn_csr,
        normalize=normalize,
        axis=axis,
        dtype=dtype,
    )




[docs]
def calculate_confusion_matrix(
    y_true: Matrix,
    y_pred: Matrix,
    normalize: bool = False,
    skip_tn: bool = False,
    axis: Optional[int] = 0,
    dtype: Optional[DType] = None,
) -> ConfusionMatrix:
    """
    Calculate the confusion matrix for the given true and predicted labels along an axis.

    Args:
        y_true: The true labels (two-dimensional).
        y_pred: The predicted labels.
        normalize: Whether to normalize the confusion matrix, resulting in rates instead of counts.
        skip_tn: Whether to skip calculating true negatives, as they may not always be needed.
            When skipped, the tn entry is filled with -1.
        axis: The axis along which to calculate the confusion matrix, must be 0 or 1.
        dtype: The data type of the output. If None, it is chosen by the underlying
            implementation (for CSR inputs, the dtype of y_true).

    Returns:
        The confusion matrix.
    """
    shared_options = dict(normalize=normalize, axis=axis, dtype=dtype)
    tp = calculate_tp(y_true, y_pred, **shared_options)
    fp = calculate_fp(y_true, y_pred, **shared_options)
    fn = calculate_fn(y_true, y_pred, **shared_options)

    n, m = y_true.shape
    if not skip_tn:
        # It is faster to derive tn from tp, fp, and fn than to count it:
        # the four entries add up to 1.0 when normalized, otherwise to the
        # number of entries along the reduced axis.
        if normalize:
            total = 1.0
        elif axis == 0:
            total = n
        else:
            total = m
        tn = -tp - fp - fn + total
    else:
        # Placeholder with the same shape and dtype as tp, filled with -1.
        tn = tp.copy()
        tn[:] = -1

    return ConfusionMatrix(tp, fp, fn, tn)



def _update_unnormalized_confusion_matrix(
    C: ConfusionMatrix,
    y_true: Matrix,
    y_pred: Matrix,
    skip_tn: bool = False,
) -> None:
    """
    Updates the given unnormalized confusion matrix in place based on provided true and predicted labels for a single instance.
    """
    if y_true.shape != y_pred.shape:
        raise ValueError("y_true and y_pred must have the same shape")

    if isinstance(y_true, DenseMatrix) and isinstance(y_pred, DenseMatrix):
        C.tp += y_true * y_pred
        C.fp += (1 - y_true) * y_pred
        C.fn += y_true * (1 - y_pred)
        if not skip_tn:
            C.tn += (1 - y_true) * (1 - y_pred)
    elif isinstance(y_true, csr_matrix) and isinstance(y_pred, csr_matrix):
        numba_add_to_unnormalized_confusion_matrix_csr(
            C.tp,
            C.fp,
            C.fn,
            C.tn,
            y_true.data,
            y_true.indices,
            y_pred.data,
            y_pred.indices,
            skip_tn=skip_tn,
        )
    else:
        raise ValueError(
            "y_true and y_pred must be both np.ndarray, both torch.Tensor, or both csr_matrix"
        )