Source code for whynot.simulators.delayed_impact.simulator

"""Implementation of delayed impact lending simulator based on Liu et al.

Liu, L., Dean, S., Rolf, E., Simchowitz, M., & Hardt, M. (2018, July). Delayed
Impact of Fair Machine Learning. In International Conference on Machine
Learning. (https://arxiv.org/abs/1803.04383)
"""
import copy
import dataclasses
import os
from typing import Callable

import whynot as wn
import whynot.traceable_numpy as np
from whynot.dynamics import BaseConfig, BaseState, BaseIntervention
from whynot.simulators.delayed_impact.fico import get_data_args as get_FICO_data


#################################
# Globally accessible FICO params
#################################
# The `data` directory that sits next to this module; it is handed to the FICO
# loader below.
DATAPATH = os.path.join(os.path.dirname(os.path.realpath(__file__)), "data")
# Loaded once, at import time. The loader returns six values; only three are
# kept and the others are discarded via `_`.
# LOAN_REPAY_PROBS is indexed by group (0 or 1) and each entry is called with a
# credit score (see determine_repayment).
# NOTE(review): INV_CDFS and GROUP_SIZE_RATIO are presumably the per-group
# inverse score CDFs and the relative group sizes -- confirm against
# fico.get_data_args; neither is used in this module's visible code.
INV_CDFS, LOAN_REPAY_PROBS, _, GROUP_SIZE_RATIO, _, _ = get_FICO_data(DATAPATH)


def default_credit_scorer(score):
    """Identity scorer: the reported credit score equals the true score."""
    reported_score = score
    return reported_score


@dataclasses.dataclass
class Config(BaseConfig):
    # pylint: disable-msg=too-few-public-methods
    """Parameters for the simulation dynamics.

    Every field can be overridden by an intervention: the dynamics replace the
    config with ``config.update(intervention)`` once the intervention's start
    round has been reached.
    """

    #: Maps the true credit score to the reported score
    credit_scorer: Callable = default_credit_scorer

    #: Lending threshold for group 0
    threshold_g0: float = 650
    #: Lending threshold for group 1
    threshold_g1: float = 650

    #: Bank repayment utility
    repayment_utility: float = 1.0
    #: Bank default utility
    default_utility: float = -4.0

    #: Applicant's score change after repayment
    repayment_score_change: float = 75
    #: Applicant's score change after default
    default_score_change: float = -150

    #: Minimum credit score (scores are clipped from below at this value)
    min_score: int = 350
    #: Maximum credit score (scores are clipped from above at this value)
    max_score: int = 800

    #: Simulation start step (in rounds)
    start_time: float = 0

    #: Simulation end step (in rounds)
    end_time: float = 1

    #: Simulator step size (Unused)
    delta_t: float = 1


@dataclasses.dataclass
class State(BaseState):
    # pylint: disable-msg=too-few-public-methods
    """State of the lending simulator.

    Describes a single agent. The field order matters: the dynamics unpack a
    state as ``(group, credit_score, profits)`` and ``simulate`` rebuilds a
    ``State`` positionally from the tuple the dynamics return.
    """

    #: Group membership (sensitive attribute) 0 or 1
    group: int = 0
    #: Agent credit score
    credit_score: int = 700
    #: Running total of the bank's profit/loss for the agent
    profits: float = 0


class Intervention(BaseIntervention):
    # pylint: disable-msg=too-few-public-methods
    """Parameterization of an intervention in the lending model.

    An intervention overrides one or more ``Config`` parameters from a given
    round of the simulation onwards.

    Examples
    --------
    >>> # Change the group 0 threshold to 700
    >>> Intervention(time=0, threshold_g0=700)

    """

    def __init__(self, time=100, **kwargs):
        """Specify an intervention in the dynamical system.

        Parameters
        ----------
            time: int
                Round of the simulation from which the intervention applies.
                The dynamics use the updated config in every round ``t`` with
                ``t >= time``.
            kwargs: dict
                Only valid keyword arguments are parameters of Config.

        """
        super().__init__(Config, time, **kwargs)


def lending_policy(config, group, score):
    """Decide whether the bank extends a loan to an agent.

    The loan is approved exactly when the score meets the threshold of the
    agent's group:

        P(T = 1 | X, A = j) = 1 if X >= tau_j, and 0 otherwise.

    The group-specific threshold is selected arithmetically rather than with a
    branch: for a 0/1 ``group`` the indicator of the other group is raised to
    the power 0 and so contributes a factor of 1.
    """
    clears_g0 = score >= config.threshold_g0
    clears_g1 = score >= config.threshold_g1
    return clears_g0 ** (1 - group) * clears_g1 ** group


def determine_repayment(rng, group, score):
    """Sample whether the agent repays a loan.

    The repayment probability is looked up from the group-specific entry of
    ``LOAN_REPAY_PROBS`` evaluated at the agent's score. For a 0/1 ``group``
    the other group's probability is raised to the power 0 and drops out.
    """
    prob_g0 = LOAN_REPAY_PROBS[0](score)
    prob_g1 = LOAN_REPAY_PROBS[1](score)
    repay_prob = prob_g0 ** (1 - group) * prob_g1 ** group

    # Sample a Bernoulli with the Gumbel-max trick to permit causal graph
    # tracing: log(u / (1 - u)) for uniform u is logistic noise, so
    # logit(p) + noise > 0 holds with probability p.
    noise = rng.uniform()
    repay_logit = np.log(repay_prob / (1.0 - repay_prob))
    noise_logit = np.log(noise / (1.0 - noise))
    return (repay_logit + noise_logit) > 0.0


def update_score(config, score, loan_approved, repaid):
    """Return the agent's credit score after one lending interaction.

    With an approved loan the score moves by ``repayment_score_change`` on
    repayment and by ``default_score_change`` on default; without a loan it is
    unchanged. The result is clipped to ``[min_score, max_score]``.

    The case analysis is written with exponents instead of branches. ``**``
    is right-associative, so each change is raised to
    ``indicator ** loan_approved``: with a loan the exponent is the 0/1
    indicator itself, without one it is 1 and the product is zeroed by the
    final ``0.0 ** (1 - loan_approved)`` factor.
    """
    repay_term = config.repayment_score_change ** (repaid ** loan_approved)
    default_term = config.default_score_change ** ((1 - repaid) ** loan_approved)
    approval_mask = 0.0 ** (1 - loan_approved)
    delta = repay_term * default_term * approval_mask

    floored = np.maximum(score + delta, config.min_score)
    return np.minimum(floored, config.max_score)


def update_profits(config, profits, loan_approved, repaid):
    """Return the bank's running profit for the agent after one interaction.

    With an approved loan the bank gains ``repayment_utility`` on repayment and
    ``default_utility`` on default; without a loan the total is unchanged.

    As in the score update, the cases are combined with exponents instead of
    branches: ``**`` is right-associative, and the trailing
    ``0.0 ** (1 - loan_approved)`` factor zeroes the change when no loan was
    made.
    """
    repay_term = config.repayment_utility ** (repaid ** loan_approved)
    default_term = config.default_utility ** ((1 - repaid) ** loan_approved)
    approval_mask = 0.0 ** (1 - loan_approved)
    return profits + repay_term * default_term * approval_mask


def dynamics(state, time, config, intervention=None, rng=None):
    """Advance the lending simulation by a single round.

    One round is one interaction between the agent (described by the state)
    and the bank: the score is measured, the bank decides on a loan, a
    repayment outcome is sampled, and the score and the bank's profit are
    updated accordingly.

    Parameters
    ----------
        state: sequence
            The three state values ``(group, credit_score, profits)`` at the
            start of the round, e.g. the values of a
            whynot.simulators.delayed_impact.State.
        time: int
            Current round of interaction
        config: whynot.simulators.delayed_impact.Config
            Configuration object controlling the interaction, e.g. lending
            threshold and credit scoring
        intervention: whynot.simulators.delayed_impact.Intervention
            Optional intervention. From round ``intervention.time`` onwards
            the config is replaced by ``config.update(intervention)``.
        rng: np.RandomState
            Random number generator for all randomness (optional). A freshly
            constructed generator is used when omitted.

    Returns
    -------
        state: tuple
            ``(group, new_credit_score, new_profits)`` after one lending
            interaction.

    """
    if intervention and time >= intervention.time:
        config = config.update(intervention)

    rng = np.random.RandomState(None) if rng is None else rng

    group, true_score, profits_so_far = state

    # The bank only sees the score reported by the credit bureau ...
    reported_score = config.credit_scorer(true_score)
    approved = lending_policy(config, group, reported_score)

    # ... while repayment is driven by the agent's true score. The outcome is
    # sampled every round; it only takes effect below if a loan was approved.
    repaid = determine_repayment(rng, group, true_score)

    next_score = update_score(config, true_score, approved, repaid)
    next_profits = update_profits(config, profits_so_far, approved, repaid)

    return group, next_score, next_profits


def simulate(initial_state, config, intervention=None, seed=None):
    """Simulate a run of the lending simulator.

    The simulation starts at initial_state, representing an agent before
    interacting with the lending institution. The simulator evolves the agent
    state through (repeated) interaction between the agent and the lender.  The
    dynamics encapsulate how the lending decisions and policies affect both the
    agent and the lender's profit. The parameters of the dynamics, e.g. the
    lending thresholds or the repayment model, are specified in the Config.

    Parameters
    ----------
        initial_state:  `whynot.simulators.delayed_impact.State`
            Initial State object, which is used as x_{t_0} for the simulator.
        config:  `whynot.simulators.delayed_impact.Config`
            Config object that encapsulates the parameters that define the
            dynamics. One round is simulated for every integer step in
            ``[start_time, end_time)``; float values are truncated to
            integers.
        intervention: `whynot.simulators.delayed_impact.Intervention`
            Intervention object that specifies what, if any, intervention to perform.
        seed: int
            Seed to set internal randomness.

    Returns
    -------
        run: `whynot.dynamics.Run`
            Rollout of the model. Contains the initial state followed by the
            state after each simulated round, with matching times.

    """
    rng = np.random.RandomState(seed)

    # Config annotates start_time/end_time as floats, but range() only accepts
    # integers, so e.g. end_time=20.0 used to raise a TypeError. Rounds are
    # discrete, hence the bounds are converted to integers up front.
    first_round = int(config.start_time)
    last_round = int(config.end_time)

    # Iterate the discrete dynamics
    times = [config.start_time]
    states = [initial_state]
    # Work on a copy so the caller's initial state is never shared with the
    # evolving state.
    state = copy.deepcopy(initial_state)
    for step in range(first_round, last_round):
        next_state = dynamics(state.values(), step, config, intervention, rng)
        state = State(*next_state)
        states.append(state)
        times.append(step + 1)

    return wn.dynamics.Run(states=states, times=times)


if __name__ == "__main__":
    # Smoke run: default agent and default config, simulated for 20 rounds.
    demo_run = simulate(State(), Config(end_time=20))
    print(demo_run)
Source code for whynot.simulators.delayed_impact.simulator

whynot

Navigation

Related Topics