# Source code for osl_dynamics.inference.metrics

"""Metrics for evaluating model performance."""

import numpy as np
from scipy.linalg import eigvalsh
from sklearn.metrics import confusion_matrix as sklearn_confusion_matrix
from tqdm.auto import trange



[docs]
def alpha_correlation(alpha_1: np.ndarray, alpha_2: np.ndarray) -> np.ndarray:
    """Correlate matching modes of two mixing coefficient time series.

    Parameters
    ----------
    alpha_1 : np.ndarray
        First alpha time series. Shape must be (n_samples, n_modes).
    alpha_2 : np.ndarray
        Second alpha time series. Shape must be (n_samples, n_modes).

    Returns
    -------
    corr : np.ndarray
        Correlation between mode :code:`i` of :code:`alpha_1` and mode
        :code:`i` of :code:`alpha_2`. Shape is (n_modes,).

    Raises
    ------
    ValueError
        If the two inputs do not have the same number of modes (columns).
    """
    n_modes = alpha_1.shape[1]
    if n_modes != alpha_2.shape[1]:
        raise ValueError(
            "alpha_1 and alpha_2 shapes are incompatible. "
            f"alpha_1.shape={alpha_1.shape}, alpha_2.shape={alpha_2.shape}."
        )

    # With rowvar=False every column is a variable, so the joint matrix is
    # (2 * n_modes, 2 * n_modes). Entry [i, n_modes + i] pairs mode i of
    # alpha_1 with mode i of alpha_2, i.e. the diagonal shifted by n_modes.
    joint = np.corrcoef(alpha_1, alpha_2, rowvar=False)
    return joint.diagonal(offset=n_modes)




[docs]
def confusion_matrix(
    state_time_course_1: np.ndarray, state_time_course_2: np.ndarray
) -> np.ndarray:
    """Confusion matrix of two state time courses.

    Counts, sample by sample, how the state selected in one time course
    lines up with the state selected in the other, using
    :code:`sklearn.metrics.confusion_matrix`. A two dimensional input is
    first collapsed with :code:`argmax(axis=1)`. This produces the expected
    result for a one-hot encoded sequence but other inputs are not
    guaranteed to behave.

    Parameters
    ----------
    state_time_course_1 : np.ndarray
        Mode time course. Shape must be (n_samples, n_states) or (n_samples,).
    state_time_course_2 : np.ndarray
        Mode time course. Shape must be (n_samples, n_states) or (n_samples,).

    Returns
    -------
    cm : np.ndarray
        Confusion matrix. Shape is (n_states, n_states).
        NOTE(review): no explicit label set is passed to scikit-learn, so the
        size presumably follows the labels actually present - confirm.

    Raises
    ------
    ValueError
        If either input is neither 1D nor 2D.
    """
    label_sequences = []
    for time_course in (state_time_course_1, state_time_course_2):
        # One-hot (or probabilistic) input -> most likely state per sample.
        if time_course.ndim == 2:
            time_course = time_course.argmax(axis=1)
        label_sequences.append(time_course)

    if any(labels.ndim != 1 for labels in label_sequences):
        raise ValueError("Both state time courses must be either 1D or 2D.")

    return sklearn_confusion_matrix(*label_sequences)




[docs]
def dice_coefficient(sequence_1: np.ndarray, sequence_2: np.ndarray) -> float:
    """Calculates the Dice coefficient.

    The Dice coefficient is 2 times the number of equal elements (equivalent to
    true-positives) divided by the sum of the total number of elements.

    Parameters
    ----------
    sequence_1 : np.ndarray
        A sequence containing either 1D discrete or 2D continuous data.
        Shape must be (n_samples, n_states) or (n_samples,).
    sequence_2 : np.ndarray
        A sequence containing either 1D discrete or 2D continuous data.
        Shape must be (n_samples, n_states) or (n_samples,).

    Returns
    -------
    dice : float
        The Dice coefficient of the two sequences.

    Raises
    ------
    ValueError
        If either sequence is not 1D or 2D, or if the two sequences do not
        contain the same number of samples.
    """
    if (sequence_1.ndim not in [1, 2]) or (sequence_2.ndim not in [1, 2]):
        raise ValueError("Both sequences must be either 1D or 2D")

    # 2D input is reduced to the index of the largest entry per sample.
    if sequence_1.ndim == 2:
        sequence_1 = sequence_1.argmax(axis=1)
    if sequence_2.ndim == 2:
        sequence_2 = sequence_2.argmax(axis=1)

    # Without this check a length-1 sequence would silently broadcast against
    # the other one and yield a meaningless score.
    n_samples_1, n_samples_2 = len(sequence_1), len(sequence_2)
    if n_samples_1 != n_samples_2:
        raise ValueError(
            "Both sequences must have the same number of samples. "
            f"Got {n_samples_1} and {n_samples_2}."
        )

    n_equal = (sequence_1 == sequence_2).sum()
    return 2 * n_equal / (n_samples_1 + n_samples_2)




[docs]
def frobenius_norm(A: np.ndarray, B: np.ndarray) -> float:
    r"""Frobenius norm of the difference between two matrices.

    The Frobenius norm is calculated as
    :math:`\sqrt{\displaystyle\sum_{ij} |a_{ij} - b_{ij}|^2}`.

    Parameters
    ----------
    A : np.ndarray
        First matrix. Shape must be (n_modes, n_channels, n_channels) or
        (n_channels, n_channels).
    B : np.ndarray
        Second matrix. Shape must be (n_modes, n_channels, n_channels) or
        (n_channels, n_channels).

    Returns
    -------
    norm : float
        The Frobenius norm of :code:`A - B`. For stacked (3D) inputs the
        norm is computed per sub-matrix and the results are summed.

    Raises
    ------
    ValueError
        If :code:`A` and :code:`B` are not both 2D or both 3D.
    """
    dims = (A.ndim, B.ndim)

    if dims == (2, 2):
        return np.linalg.norm(A - B, ord="fro")

    if dims == (3, 3):
        # One norm per matrix in the stack, taken over the last two axes.
        per_matrix = np.linalg.norm(A - B, ord="fro", axis=(1, 2))
        return np.sum(per_matrix)

    raise ValueError(
        f"Shape of A and/or B is incorrect. A.shape={A.shape}, B.shape={B.shape}."
    )




[docs]
def pairwise_frobenius_distance(matrices: np.ndarray) -> np.ndarray:
    """Pairwise Frobenius distance between the matrices in a set.

    Parameters
    ----------
    matrices : np.ndarray
        The set of matrices. Shape must be (n_matrices, n_channels, n_channels).

    Returns
    -------
    pairwise_distance : np.ndarray
        Matrix of pairwise Frobenius distance.
        Shape is (n_matrices, n_matrices).

    See Also
    --------
    frobenius_norm
    """
    # Broadcasting (1, M, N, N) against (M, 1, N, N) produces every pairwise
    # difference in a single (M, M, N, N) array.
    as_row = np.expand_dims(matrices, 0)
    as_column = np.expand_dims(matrices, 1)
    squared_difference = np.square(as_row - as_column)

    # Collapse the two matrix axes to get one distance per pair.
    summed = np.sum(squared_difference, axis=(-2, -1))
    return np.sqrt(summed)




[docs]
def pairwise_matrix_correlations(
    matrices: np.ndarray, remove_diagonal: bool = False
) -> np.ndarray:
    """Correlation between (flattened) matrices, for every pair in a set.

    Parameters
    ----------
    matrices : np.ndarray
        Matrices. Shape must be (M, N, N).
    remove_diagonal : bool, optional
        If :code:`True`, the identity matrix is subtracted from the result
        after the correlations have been calculated.

    Returns
    -------
    correlations : np.ndarray
        Pairwise Pearson correlation between elements of each flattened matrix.
        Shape is (M, M).
    """
    n_matrices = matrices.shape[0]

    # One row per matrix, so np.corrcoef treats each matrix as a variable.
    flattened = matrices.reshape(n_matrices, -1)
    correlations = np.corrcoef(flattened)

    if not remove_diagonal:
        return correlations
    return correlations - np.eye(n_matrices)




[docs]
def riemannian_distance(
    M1: np.ndarray, M2: np.ndarray, threshold: float = 1e-3
) -> float:
    r"""Riemannian distance between two matrices.

    The distance is computed as
    :math:`d = \sqrt{\displaystyle\sum_i \log^2(\lambda_i)}`, where
    :math:`\lambda_i` are the generalized eigenvalues of the pair
    :math:`(M_1, M_2)` returned by :code:`scipy.linalg.eigvalsh`.

    Parameters
    ----------
    M1 : np.ndarray
        First matrix. Shape must be (N, N).
    M2 : np.ndarray
        Second matrix. Shape must be (N, N).
    threshold : float, optional
        Threshold to apply when there are negative eigenvalues.
        Must be positive.

    Returns
    -------
    d : float
        Riemannian distance.
    """
    generalized_eigvals = eigvalsh(M1, M2, driver="gv")

    # Clipping only happens when at least one eigenvalue is negative; in that
    # case every eigenvalue below the threshold is raised to it.
    has_negative = np.any(generalized_eigvals < 0)
    if has_negative:
        generalized_eigvals = np.maximum(generalized_eigvals, threshold)

    log_eigvals = np.log(generalized_eigvals)
    return np.sqrt(np.sum(log_eigvals**2))




[docs]
def pairwise_riemannian_distances(
    matrices: np.ndarray, threshold: float = 1e-3
) -> np.ndarray:
    """Calculate the Riemannian distance between matrices.

    Parameters
    ----------
    matrices : np.ndarray
        Matrices. Shape must be (M, N, N).
    threshold : float, optional
        Threshold to apply when there are negative eigenvalues.
        Must be positive.

    Returns
    -------
    riemannian_distances : np.ndarray
        Matrix containing the pairwise Riemannian distances between matrices.
        Shape is (M, M).

    See Also
    --------
    riemannian_distance
    """
    # ndarray.astype returns a new array, so the result has to be re-bound for
    # the cast to take effect. Complex input is left untouched so that its
    # imaginary part is not silently discarded.
    if not np.iscomplexobj(matrices):
        matrices = matrices.astype(np.float64)

    n_matrices = matrices.shape[0]
    riemannian_distances = np.zeros([n_matrices, n_matrices])
    for i in trange(n_matrices, desc="Computing Riemannian distances"):
        for j in range(i + 1, n_matrices):
            riemannian_distances[i, j] = riemannian_distance(
                matrices[i], matrices[j], threshold=threshold
            )

    # Only the upper triangular entries are filled and the diagonal entries
    # are zeros, so adding the transpose mirrors them into the lower triangle.
    riemannian_distances = riemannian_distances + riemannian_distances.T

    return riemannian_distances




[docs]
def pairwise_rv_coefficient(
    matrices: np.ndarray, remove_diagonal: bool = False
) -> np.ndarray:
    """Pairwise RV coefficient between the matrices in a set.

    Parameters
    ----------
    matrices : np.ndarray
        Set of matrices. Shape must be (M, N, N).
    remove_diagonal : bool, optional
        If :code:`True`, the identity matrix is subtracted from the result
        after the coefficients have been calculated.

    Returns
    -------
    rv_coefficients : np.ndarray
        Matrix of pairwise RV coefficients. Shape is (M, M).
    """
    # Scalar product matrix (X X^T) of every matrix in the set.
    scalar_products = [np.dot(matrix, matrix.T) for matrix in matrices]

    # trace(S_i^T S_i) only depends on i, so it is evaluated once per matrix
    # and reused as the normalisation term of every pair involving i.
    self_traces = [np.trace(np.dot(s.T, s)) for s in scalar_products]

    # 'Between study cosine matrix': normalised trace inner product of the
    # scalar product matrices of each pair.
    n_matrices = matrices.shape[0]
    rv_coefficients = np.zeros([n_matrices, n_matrices])
    for row in range(n_matrices):
        for col in range(n_matrices):
            cross_trace = np.trace(
                np.dot(scalar_products[row].T, scalar_products[col])
            )
            normalisation = np.sqrt(np.dot(self_traces[row], self_traces[col]))
            rv_coefficients[row, col] = cross_trace / normalisation

    if remove_diagonal:
        rv_coefficients -= np.eye(n_matrices)

    return rv_coefficients




[docs]
def pairwise_congruence_coefficient(
    matrices: np.ndarray, remove_diagonal: bool = False
) -> np.ndarray:
    """Pairwise congruence coefficient between the matrices in a set.

    Parameters
    ----------
    matrices : np.ndarray
        Set of symmetric semi-positive definite matrices. Shape is (M, N, N).
    remove_diagonal : bool, optional
        If :code:`True`, the identity matrix is subtracted from the result
        after the coefficients have been calculated.

    Returns
    -------
    congruence_coefficient : np.ndarray
        Matrix of pairwise congruence coefficients. Shape is (M, M).
    """
    n_matrices = matrices.shape[0]

    # trace(A_i^T A_i) only depends on i, so it is evaluated once per matrix
    # and reused as the normalisation term of every pair involving i.
    self_traces = [
        np.trace(np.dot(matrices[k].T, matrices[k])) for k in range(n_matrices)
    ]

    congruence_coefficient = np.zeros([n_matrices, n_matrices])
    for row in range(n_matrices):
        for col in range(n_matrices):
            cross_trace = np.trace(np.dot(matrices[row].T, matrices[col]))
            normalisation = np.sqrt(np.dot(self_traces[row], self_traces[col]))
            congruence_coefficient[row, col] = cross_trace / normalisation

    if remove_diagonal:
        congruence_coefficient -= np.eye(n_matrices)

    return congruence_coefficient




[docs]
def pairwise_l2_distance(arrays: np.ndarray, batch_dims: int = 0) -> np.ndarray:
    """Pairwise L2 distance.

    Calculate the pairwise L2 distance along the first axis after :code:`batch_dims`.

    Parameters
    ----------
    arrays : np.ndarray
        Set of arrays. Shape is (..., n_sessions, ...).
    batch_dims : int, optional
        Number of batch dimensions. Must satisfy
        :code:`0 <= batch_dims <= arrays.ndim - 1`.

    Returns
    -------
    pairwise_distance : np.ndarray
        Matrix of pairwise L2 distance. Shape is (..., n_sessions, n_sessions).

    Raises
    ------
    ValueError
        If :code:`batch_dims` is negative or greater than
        :code:`arrays.ndim - 1`.
    """
    # A negative value would make the two expand_dims calls insert their axes
    # at unrelated positions and produce a result of the wrong shape, so it is
    # rejected together with values that leave no axis to pair over.
    if batch_dims < 0 or batch_dims > arrays.ndim - 1:
        raise ValueError(
            "batch_dims must be between 0 and arrays.ndim - 1 (inclusive). "
            f"Got batch_dims={batch_dims} for arrays.ndim={arrays.ndim}."
        )

    pairwise_axis = batch_dims

    # Inserting a length-1 axis before and after the pairwise axis lets
    # broadcasting build every pairwise difference at once.
    difference = np.expand_dims(arrays, pairwise_axis) - np.expand_dims(
        arrays, pairwise_axis + 1
    )

    # All axes after the two pairwise axes are reduced. When there are none
    # the tuple is empty and the result is the absolute difference.
    reduced_axes = tuple(range(pairwise_axis + 2, arrays.ndim + 1))
    return np.sqrt(np.sum(np.square(difference), axis=reduced_axes))