Source code for dmae.metrics

# -*- coding: utf-8 -*-
"""
The :mod:`dmae.metrics` module implements some evaluation metrics that are used
in the paper.
"""
# Author: Juan S. Lara <julara@unal.edu.co>
# License: MIT

import numpy as _np
from scipy.optimize import linear_sum_assignment as _linear_sum_assignment

[docs]def unsupervised_classification_accuracy(y_true, y_pred):
    """

    Scipy-based implementation of the unsupervised classification accuracy.

    Parameters
    ----------
    y_true: array-like, shape=(n_samples, )
        Array with the Ground truth labels.
    y_pred: array-like, shape=(n_samples, )
        Array with the predicted labels.

    Returns
    -------
    uacc: float
        Unsupervised classification accuracy between y_true and y_pred.
    """
    
    D = max(y_pred.max(), y_true.max()) + 1
    w = _np.zeros((D, D), dtype=_np.int64)

    for i in range(y_pred.size):
        w[y_pred[i], y_true[i]] += 1

    ind = _np.array(
            _linear_sum_assignment(
                w.max() - w
                )
            ).T

    return sum([w[i, j] for i, j in ind])*1.0/y_pred.size

[docs]def zero_norm(preds, thr=1e-7):
    """
    Numpy implementation of the L0 norm.

    Parameters
    ----------
    preds: array-like, shape=(n_samples, n_clusters)
        Soft-assignments extracted from a DM-Encoder
    thr: float
        Threshold used to compute the L0 norm.

    Returns
    -------
    L0: float
        L0 norm of the soft-assignments.
    """
    
    counts = (preds>thr).astype("float32").sum(axis=1)
    return counts