Source code for holisticai.bias.mitigation.postprocessing.calibrated_eq_odds_postprocessing

from __future__ import annotations

from typing import Literal

import numpy as np
from holisticai.utils.transformers.bias import BMPostprocessing as BMPost



[docs]
class CalibratedEqualizedOdds(BMPost):
    r"""
    Calibrated equalized odds postprocessing optimizes over calibrated classifier score outputs to find \
    probabilities with which to change output labels with an equalized odds objective.

    Parameters
    ----------
    cost_constraint : str
        Strategy used to evaluate the cost function. The available constraints are "fnr" \
        (false negative rate), "fpr" (false positive rate), and "weighted".

    alpha : float
        Used only with cost constraint "weighted".
        Value between 0 and 1 used to combine the fnr and fpr cost constraints.
        If None, the base rate of each group is used instead.

    seed: int
        A seed value for random number generators. This ensures reproducibility of results.

    Examples
    --------
    >>> from holisticai.bias.mitigation import CalibratedEqualizedOdds
    >>> mitigator = CalibratedEqualizedOdds(**params)
    >>> mitigator.fit(y, y_proba, group_a, group_b)
    >>> test_data_transformed = mitigator.transform(y_pred, y_proba, group_a, group_b)

    References
    ----------
    .. [1] Pleiss, Geoff, et al. “On fairness and calibration.” Advances in neural information processing systems 30 (2017).

    """

    COST_CONSTRAINT = Literal["fnr", "fpr", "weighted"]

    def __init__(
        self,
        cost_constraint: str = "fnr",
        alpha: float | None = None,
        seed: int | None = 42,
    ):
        self.cost_constraint = cost_constraint
        self.alpha = alpha
        self.random_state = np.random.RandomState(seed)

    def _build_cost(self, y, y_score, base_rate, sample_weight):
        """
        Combine the generalized error rates of one group into a single cost.

        The cost is ``(1 - w) * GFPR + w * GFNR`` where ``w`` is 0 for the
        "fpr" constraint, 1 for "fnr", and for "weighted" either ``self.alpha``
        or, when that is None, ``base_rate``.

        Parameters
        ----------
        y : array-like
            Target vector of the group.
        y_score : array-like
            Scores of the group.
        base_rate : float
            Fallback weight for the "weighted" constraint.
        sample_weight : array-like
            Per-sample weights forwarded to the generalized rate helpers.

        Returns
        -------
        float
            The combined cost.

        Raises
        ------
        ValueError
            If ``self.cost_constraint`` is not "fpr", "fnr" or "weighted".
        """
        constraint = self.cost_constraint
        if constraint == "fpr":
            fnr_share = 0
        elif constraint == "fnr":
            fnr_share = 1
        elif constraint == "weighted":
            fnr_share = self.alpha
            if fnr_share is None:
                fnr_share = base_rate
        else:
            raise ValueError(f"unknown cost constraint: {constraint}")

        # The constraint is validated above, before any rate is computed.
        fpr_term = (1 - fnr_share) * _generalized_fpr(y, y_score, sample_weight=sample_weight)
        fnr_term = fnr_share * _generalized_fnr(y, y_score, sample_weight=sample_weight)
        return fpr_term + fnr_term

    def _build_cost_variables(self, y, y_score, sample_weight):
        """
        Compute the base rate and the two costs needed to derive a mix rate.

        Parameters
        ----------
        y : numpy.ndarray
            Target vector of one group.
        y_score : numpy.ndarray
            Scores of the same group.
        sample_weight : numpy.ndarray
            Per-sample weights of the same group.

        Returns
        -------
        tuple
            ``(base_rate, cost, trivial_cost)`` where ``base_rate`` is the
            unweighted mean of ``y``, ``cost`` is the cost of ``y_score`` and
            ``trivial_cost`` is the cost of a predictor that outputs
            ``base_rate`` for every sample.
        """
        base_rate = y.mean()
        shared = {"y": y, "base_rate": base_rate, "sample_weight": sample_weight}

        cost = self._build_cost(y_score=y_score, **shared)
        # Constant predictor: every score is replaced by the group's base rate.
        trivial_cost = self._build_cost(y_score=np.full_like(y_score, base_rate), **shared)
        return base_rate, cost, trivial_cost

    def _mitigate_bias_score(self, y_score, group, mix_rate, base_rate):
        """
        Randomly replace a share of one group's scores with a constant.

        Parameters
        ----------
        y_score : numpy.ndarray
            Scores of all samples.
        group : array-like
            Membership mask; entries equal to 1 (or True) select the members.
        mix_rate : float
            Probability with which each member's score is replaced.
        base_rate : float
            Value written in place of every replaced score.

        Returns
        -------
        numpy.ndarray
            A copy of the members' scores (one entry per member) in which the
            randomly selected entries are set to ``base_rate``. ``y_score``
            itself is not modified.
        """
        # Build the mask once so the number of draws always matches the number
        # of selected scores, and count it in NumPy instead of a Python loop.
        members = np.asarray(group) == 1
        n_members = int(np.count_nonzero(members))

        # Draws lie in [0, 1): a strict comparison replaces each score with
        # probability exactly mix_rate and never replaces when mix_rate is 0.
        replace = self.random_state.random(n_members) < mix_rate

        new_y_score = y_score[members].copy()
        new_y_score[replace] = base_rate
        return new_y_score


[docs]
    def fit(
        self,
        y: np.ndarray,
        y_proba: np.ndarray,
        group_a: np.ndarray,
        group_b: np.ndarray,
        sample_weight: np.ndarray | None = None,
    ):
        """
        Compute the parameters of the calibrated equalized odds algorithm.

        For each group the base rate, the cost of the given scores and the cost
        of a constant base-rate predictor are computed. The group with the
        lower cost receives a non-zero mix rate; the other group's mix rate is 0.
        The results are stored in ``base_rate_a``, ``base_rate_b``,
        ``a_mix_rate`` and ``b_mix_rate``.

        Parameters
        ----------
        y : array-like
            Target vector
        y_proba : matrix-like
            Predicted probability matrix (num_examples, num_classes). The probability
            estimates must sum to 1 across the possible classes and each matrix value
            must be in the interval [0,1].
        group_a : array-like
            Group membership vector (binary)
        group_b : array-like
            Group membership vector (binary)
        sample_weight : array-like
            Sample weights. Used to weight generalized false positive rate (GFPR) and
            generalized false negative rate (GFNR). Sample weights could be used during training
            or computed by previous preprocessing strategy.

        Returns
        -------
        Self

        Notes
        -----
        The mix rate is a ratio of cost differences and the denominator is not
        guarded: a group whose cost equals its trivial cost divides by zero.
        """
        loaded = self._load_data(
            y=y,
            y_proba=y_proba,
            group_a=group_a,
            group_b=group_b,
            sample_weight=sample_weight,
        )

        mask_a = loaded["group_a"] == 1
        mask_b = loaded["group_b"] == 1
        targets = loaded["y"]
        scores = loaded["y_score"]
        weights = loaded["sample_weight"]

        self.base_rate_a, cost_a, trivial_cost_a = self._build_cost_variables(
            targets[mask_a], scores[mask_a], sample_weight=weights[mask_a]
        )
        self.base_rate_b, cost_b, trivial_cost_b = self._build_cost_variables(
            targets[mask_b], scores[mask_b], sample_weight=weights[mask_b]
        )

        # Only the cheaper group is mixed towards its trivial predictor.
        if cost_b > cost_a:
            self.a_mix_rate = (cost_b - cost_a) / (trivial_cost_a - cost_a)
            self.b_mix_rate = 0
        else:
            self.a_mix_rate = 0
            self.b_mix_rate = (cost_a - cost_b) / (trivial_cost_b - cost_b)
        return self



[docs]
    def transform(
        self,
        y_pred: np.ndarray,
        y_proba: np.ndarray,
        group_a: np.ndarray,
        group_b: np.ndarray,
        threshold: float | None = 0.5,
    ):
        """
        Apply the fitted mix rates to scores and predictions.

        Within each group a random share of the scores (given by the group's
        fitted mix rate) is replaced by the group's fitted base rate, and the
        group's labels are then recomputed by thresholding the new scores.
        Samples that belong to neither group keep their score and label.
        Random numbers are drawn from the instance's generator, first for
        group a and then for group b.

        Parameters
        ----------
        y_pred : array-like
            Predicted vector (nb_examples,)
        y_proba : matrix-like
            Predicted probability matrix (num_examples, num_classes). The probability
            estimates must sum to 1 across the possible classes and each matrix value
            must be in the interval [0,1].
        group_a : array-like
            Group membership vector (binary)
        group_b : array-like
            Group membership vector (binary)
        threshold : float
            Scores greater than or equal to this value are labelled 1, others 0.

        Returns
        -------
        dict
            ``{"y_pred": new labels, "y_score": new scores}``
        """
        loaded = self._load_data(y_pred=y_pred, y_proba=y_proba, group_a=group_a, group_b=group_b)

        mask_a = loaded["group_a"] == 1
        mask_b = loaded["group_b"] == 1
        labels = loaded["y_pred"]
        scores = loaded["y_score"]

        # Group a is processed before group b so the random stream is consumed
        # in a fixed order.
        plan = (
            (mask_a, self.a_mix_rate, self.base_rate_a),
            (mask_b, self.b_mix_rate, self.base_rate_b),
        )
        mitigated = [self._mitigate_bias_score(scores, mask, rate, base) for mask, rate, base in plan]

        adjusted_scores = scores.copy()
        for (mask, _, _), group_scores in zip(plan, mitigated):
            adjusted_scores[mask] = group_scores

        adjusted_labels = labels.copy()
        for mask in (mask_a, mask_b):
            adjusted_labels[mask] = (adjusted_scores[mask] >= threshold).astype(int)

        return {
            "y_pred": adjusted_labels,
            "y_score": adjusted_scores,
        }



[docs]
    def fit_transform(
        self,
        y: np.ndarray,
        y_proba: np.ndarray,
        group_a: np.ndarray,
        group_b: np.ndarray,
        sample_weight: np.ndarray | None = None,
        threshold: float | None = 0.5,
    ):
        """
        Fit on the given data and immediately transform the same data.

        Parameters
        ----------
        y : array-like
            Target vector
        y_proba : matrix-like
            Predicted probability matrix (num_examples, num_classes). The probability
            estimates must sum to 1 across the possible classes and each matrix value
            must be in the interval [0,1].
        group_a : array-like
            Group membership vector (binary)
        group_b : array-like
            Group membership vector (binary)
        sample_weight : array-like
            Sample weights. Used to weight generalized false positive rate (GFPR) and
            generalized false negative rate (GFNR). Sample weights could be used during training
            or computed by previous preprocessing strategy.
        threshold : float
            float value to discriminate between 0 and 1

        Returns
        -------
        dict
            A dictionary of new predictions
        """
        fitted = self.fit(
            y=y,
            y_proba=y_proba,
            group_a=group_a,
            group_b=group_b,
            sample_weight=sample_weight,
        )
        # NOTE(review): the target vector is forwarded as ``y_pred``. transform
        # overwrites the labels of samples in group_a or group_b, so samples in
        # neither group come back with their true label rather than a
        # prediction - confirm this is intended.
        return fitted.transform(
            y_pred=y,
            y_proba=y_proba,
            group_a=group_a,
            group_b=group_b,
            threshold=threshold,
        )




def _generalized_fpr(y, y_score, sample_weight):
    """
    Return the generalized false positive rate.

    This is the weighted mean of ``y_score`` over the samples whose label is
    not 1, using ``sample_weight`` as weights. No guard is applied when the
    weights of those samples sum to zero.
    """
    is_negative = np.not_equal(y, 1)
    weights = sample_weight[is_negative]
    weighted_scores = y_score[is_negative] * weights
    return weighted_scores.sum() / weights.sum()


def _generalized_fnr(y, y_score, sample_weight):
    """
    Return the generalized false negative rate.

    This is the weighted mean of ``1 - y_score`` over the samples whose label
    is 1, using ``sample_weight`` as weights. No guard is applied when the
    weights of those samples sum to zero.
    """
    is_positive = np.equal(y, 1)
    weights = sample_weight[is_positive]
    weighted_misses = (1 - y_score[is_positive]) * weights
    return weighted_misses.sum() / weights.sum()