Source code for mapie.conformity_scores.sets.topk

from typing import Optional, Union, cast

import numpy as np
from numpy.typing import NDArray
from sklearn.model_selection import BaseCrossValidator

from mapie._machine_precision import EPSILON
from mapie.conformity_scores.classification import BaseClassificationScore
from mapie.conformity_scores.sets.utils import get_true_label_position
from mapie.utils import _compute_quantiles


[docs] class TopKConformityScore(BaseClassificationScore): """ Top-K method-based non-conformity score. It is based on the sorted index of the probability of the true label in the softmax outputs, on the conformalization set. In case two probabilities are equal, both are taken, thus, the size of some prediction sets may be different from the others. References ---------- [1] Anastasios Nikolas Angelopoulos, Stephen Bates, Michael Jordan and Jitendra Malik. "Uncertainty Sets for Image Classifiers using Conformal Prediction." International Conference on Learning Representations 2021. Attributes ---------- classes: Optional[ArrayLike] Names of the classes. random_state: Optional[Union[int, np.random.RandomState]] Pseudo random number generator state. quantiles_: ArrayLike of shape (n_alpha) The quantiles estimated from ``get_sets`` method. """
[docs] def __init__(self) -> None: super().__init__()
[docs] def get_conformity_scores( self, y: NDArray, y_pred: NDArray, y_enc: Optional[NDArray] = None, **kwargs ) -> NDArray: """ Get the conformity score. Parameters ---------- y: NDArray of shape (n_samples,) Observed target values. y_pred: NDArray of shape (n_samples,) Predicted target values. y_enc: NDArray of shape (n_samples,) Target values as normalized encodings. Returns ------- NDArray of shape (n_samples,) Conformity scores. """ # Casting y_enc = cast(NDArray, y_enc) # Conformity scores # Here we reorder the labels by decreasing probability and get the # position of each label from decreasing probability conformity_scores = get_true_label_position(y_pred, y_enc) return conformity_scores
[docs] def get_predictions( self, X: NDArray, alpha_np: NDArray, y_pred_proba: NDArray, cv: Optional[Union[int, str, BaseCrossValidator]], **kwargs, ) -> NDArray: """ Just processes the passed y_pred_proba. Parameters ----------- X: NDArray of shape (n_samples, n_features) Observed feature values (not used since predictions are passed). alpha_np: NDArray of shape (n_alpha,) NDArray of floats between ``0`` and ``1``, represents the uncertainty of the confidence interval. y_pred_proba: NDArray Predicted probabilities from the estimator. cv: Optional[Union[int, str, BaseCrossValidator]] Cross-validation strategy used by the estimator (not used here). Returns -------- NDArray Array of predictions. """ y_pred_proba = np.repeat(y_pred_proba[:, :, np.newaxis], len(alpha_np), axis=2) return y_pred_proba
[docs] def get_conformity_score_quantiles( self, conformity_scores: NDArray, alpha_np: NDArray, cv: Optional[Union[int, str, BaseCrossValidator]], **kwargs, ) -> NDArray: """ Get the quantiles of the conformity scores for each uncertainty level. Parameters ----------- conformity_scores: NDArray of shape (n_samples,) Conformity scores for each sample. alpha_np: NDArray of shape (n_alpha,) NDArray of floats between 0 and 1, representing the uncertainty of the confidence interval. cv: Optional[Union[int, str, BaseCrossValidator]] Cross-validation strategy used by the estimator (not used here). Returns -------- NDArray Array of quantiles with respect to alpha_np. """ return _compute_quantiles(conformity_scores, alpha_np)
[docs] def get_prediction_sets( self, y_pred_proba: NDArray, conformity_scores: NDArray, alpha_np: NDArray, cv: Optional[Union[int, str, BaseCrossValidator]], **kwargs, ) -> NDArray: """ Generate prediction sets based on the probability predictions, the conformity scores and the uncertainty level. Parameters ----------- y_pred_proba: NDArray of shape (n_samples, n_classes) Target prediction. conformity_scores: NDArray of shape (n_samples,) Conformity scores for each sample (not used here). alpha_np: NDArray of shape (n_alpha,) NDArray of floats between 0 and 1, representing the uncertainty of the confidence interval (not used here). cv: Optional[Union[int, str, BaseCrossValidator]] Cross-validation strategy used by the estimator (not used here). Returns -------- NDArray Array of quantiles with respect to alpha_np. """ y_pred_proba = y_pred_proba[:, :, 0] index_sorted = np.fliplr(np.argsort(y_pred_proba, axis=1)) y_pred_index_last = np.stack( [index_sorted[:, quantile] for quantile in self.quantiles_], axis=1 ) y_pred_proba_last = np.stack( [ np.take_along_axis( y_pred_proba, y_pred_index_last[:, iq].reshape(-1, 1), axis=1 ) for iq, _ in enumerate(self.quantiles_) ], axis=2, ) prediction_sets = np.greater_equal( y_pred_proba[:, :, np.newaxis] - y_pred_proba_last, -EPSILON ) return prediction_sets