Source code for pygod.utils.metric

# -*- coding: utf-8 -*-
"""
Metrics used to evaluate the anomaly detection performance
"""
# Author: Yingtong Dou <ytongdou@gmail.com>
# License: BSD 2 clause

from sklearn.metrics import roc_auc_score, average_precision_score


def eval_roc_auc(labels, pred):
    """
    ROC-AUC score for binary classification.

    Parameters
    ----------
    labels : numpy.array
        Labels in shape of ``(N, )``, where 1 represents outliers,
        0 represents normal instances.
    pred : numpy.array
        Outlier scores in shape of ``(N, )``.

    Returns
    -------
    roc_auc : float
        ROC-AUC score.
    """
    # outlier detection is a binary classification problem
    roc_auc = roc_auc_score(y_true=labels, y_score=pred)
    return roc_auc
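
# Illustrative usage sketch (not part of the original module); the toy
# arrays below are hypothetical:
#
#     import numpy as np
#     labels = np.array([1, 0, 1, 0, 0])   # two outliers, three normals
#     pred = np.array([0.9, 0.8, 0.7, 0.2, 0.1])
#     eval_roc_auc(labels, pred)           # 5/6 ~ 0.83: in five of the six
#                                          # (outlier, normal) pairs the
#                                          # outlier is scored higher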


def eval_recall_at_k(labels, pred, k, threshold=0.5):
    """
    Recall score for top k instances with the highest outlier scores.

    Parameters
    ----------
    labels : numpy.array
        Labels in shape of ``(N, )``, where 1 represents outliers,
        0 represents normal instances.
    pred : numpy.array
        Outlier scores in shape of ``(N, )``.
    k : int
        The number of instances to evaluate.
    threshold : float
        The binary classification threshold.

    Returns
    -------
    recall_at_k : float
        Recall for top k instances with the highest outlier scores.
    """
    scores = [(s, l) for s, l in zip(pred, labels)]
    scores.sort(reverse=True, key=lambda x: x[0])

    # Number of true outliers
    n_true = sum(l for (_, l) in scores)

    # Number of true positive instances in top k
    n_true_and_pred_k = sum((l and (s >= threshold))
                            for (s, l) in scores[:k])

    recall_at_k = n_true_and_pred_k / n_true if n_true != 0 else 0.0
    return recall_at_k
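
# Illustrative usage sketch (not part of the original module); the toy
# arrays below are hypothetical:
#
#     import numpy as np
#     labels = np.array([1, 0, 1, 0, 1])     # three true outliers
#     pred = np.array([0.9, 0.8, 0.7, 0.2, 0.6])
#     eval_recall_at_k(labels, pred, k=3)    # 2/3: the top-3 scores contain
#                                            # two of the three true outliers,
#                                            # both above the 0.5 threshold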


def eval_precision_at_k(labels, pred, k, threshold=0.5):
    """
    Precision score for top k instances with the highest outlier scores.

    Parameters
    ----------
    labels : numpy.array
        Labels in shape of ``(N, )``, where 1 represents outliers,
        0 represents normal instances.
    pred : numpy.array
        Outlier scores in shape of ``(N, )``.
    k : int
        The number of instances to evaluate.
    threshold : float
        The binary classification threshold.

    Returns
    -------
    precision_at_k : float
        Precision for top k instances with the highest outlier scores.
    """
    scores = [(s, l) for s, l in zip(pred, labels)]
    scores.sort(reverse=True, key=lambda x: x[0])

    # Number of predicted outliers in top k
    n_pred_k = sum((s >= threshold) for (s, _) in scores[:k])

    # Number of true positive instances in top k
    n_true_and_pred_k = sum((l and (s >= threshold))
                            for (s, l) in scores[:k])

    precision_at_k = n_true_and_pred_k / n_pred_k if n_pred_k != 0 else 0.0
    return precision_at_k
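
# Illustrative usage sketch (not part of the original module); the toy
# arrays below are hypothetical:
#
#     import numpy as np
#     labels = np.array([1, 0, 1, 0, 1])
#     pred = np.array([0.9, 0.8, 0.7, 0.2, 0.6])
#     eval_precision_at_k(labels, pred, k=3)  # 2/3: of the three top-3
#                                             # instances scored >= 0.5,
#                                             # two are true outliers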


def eval_average_precision(labels, pred):
    """
    Average precision score for binary classification.

    Parameters
    ----------
    labels : numpy.array
        Labels in shape of ``(N, )``, where 1 represents outliers,
        0 represents normal instances.
    pred : numpy.array
        Outlier scores in shape of ``(N, )``.

    Returns
    -------
    ap : float
        Average precision score.
    """
    # outlier detection is a binary classification problem
    ap = average_precision_score(y_true=labels, y_score=pred)
    return ap
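
# Illustrative usage sketch (not part of the original module); the toy
# arrays below are hypothetical:
#
#     import numpy as np
#     labels = np.array([1, 0, 1, 0, 0])
#     pred = np.array([0.9, 0.8, 0.7, 0.2, 0.1])
#     eval_average_precision(labels, pred)   # 5/6 ~ 0.83: precision is 1 at
#                                            # the first outlier (rank 1) and
#                                            # 2/3 at the second (rank 3)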