# Source code for causalml.metrics.sensitivity

import logging
import numpy as np
import pandas as pd
from collections import defaultdict
import matplotlib.pyplot as plt
from importlib import import_module

# Module-level logger used by the sensitivity-analysis classes below.
logger = logging.getLogger("sensitivity")

# Column order shared by every sensitivity summary DataFrame produced in this module.
SUMMARY_COLS = ["Method", "ATE", "New ATE", "New ATE LB", "New ATE UB"]


def one_sided(alpha, p, treatment):
    """One sided confounding function.

    Yields ``alpha * (1 - p)`` for treated units and ``-alpha * p`` for
    control units.

    Reference:  Blackwell, Matthew. "A selection bias approach to sensitivity analysis
    for causal effects." Political Analysis 22.2 (2014): 169-182.
    https://www.mattblackwell.org/files/papers/causalsens.pdf

    Args:
        alpha (np.array): a confounding values vector
        p (np.array): a propensity score vector between 0 and 1
        treatment (np.array): a treatment vector (1 if treated, otherwise 0)
    """
    assert treatment.shape[0] == p.shape[0]
    control = 1 - treatment
    return alpha * (1 - p) * treatment - alpha * p * control


def alignment(alpha, p, treatment):
    """Alignment confounding function.

    Yields ``alpha * (1 - p)`` for treated units and ``alpha * p`` for
    control units (same sign for both groups).

    Reference:  Blackwell, Matthew. "A selection bias approach to sensitivity analysis
    for causal effects." Political Analysis 22.2 (2014): 169-182.
    https://www.mattblackwell.org/files/papers/causalsens.pdf

    Args:
        alpha (np.array): a confounding values vector
        p (np.array): a propensity score vector between 0 and 1
        treatment (np.array): a treatment vector (1 if treated, otherwise 0)
    """
    assert treatment.shape[0] == p.shape[0]
    control = 1 - treatment
    return alpha * (1 - p) * treatment + alpha * p * control


def one_sided_att(alpha, p, treatment):
    """One sided confounding function for the average effect of the treatment among the treated units (ATT)

    Zero for treated units, ``alpha`` for control units. The propensity score
    ``p`` is unused here but kept for a uniform confounding-function interface.

    Reference:  Blackwell, Matthew. "A selection bias approach to sensitivity analysis
    for causal effects." Political Analysis 22.2 (2014): 169-182.
    https://www.mattblackwell.org/files/papers/causalsens.pdf

    Args:
        alpha (np.array): a confounding values vector
        p (np.array): a propensity score vector between 0 and 1
        treatment (np.array): a treatment vector (1 if treated, otherwise 0)
    """
    assert treatment.shape[0] == p.shape[0]
    return (1 - treatment) * alpha


def alignment_att(alpha, p, treatment):
    """Alignment confounding function for the average effect of the treatment among the treated units (ATT)

    Zero for treated units, ``alpha`` for control units. The propensity score
    ``p`` is unused here but kept for a uniform confounding-function interface.

    NOTE(review): this is identical to ``one_sided_att``; the causalsens R
    package distinguishes the two ATT adjustments by sign — confirm against
    the reference implementation.

    Reference:  Blackwell, Matthew. "A selection bias approach to sensitivity analysis
    for causal effects." Political Analysis 22.2 (2014): 169-182.
    https://www.mattblackwell.org/files/papers/causalsens.pdf

    Args:
        alpha (np.array): a confounding values vector
        p (np.array): a propensity score vector between 0 and 1
        treatment (np.array): a treatment vector (1 if treated, otherwise 0)
    """
    assert treatment.shape[0] == p.shape[0]
    return (1 - treatment) * alpha


class Sensitivity(object):
    """A Sensitivity Check class to support Placebo Treatment, Irrelevant Additional Confounder
    and Subset validation refutation methods to verify causal inference.

    Reference: https://github.com/microsoft/dowhy/blob/master/dowhy/causal_refuters/
    """

    def __init__(
        self,
        df,
        inference_features,
        p_col,
        treatment_col,
        outcome_col,
        learner,
        *args,
        **kwargs,
    ):
        """Initialize.

        Args:
            df (pd.DataFrame): input data frame
            inference_features (list of str): a list of columns that used in learner for inference
            p_col (str): column name of propensity score
            treatment_col (str): column name of whether in treatment of control
            outcome_col (str): column name of outcome
            learner (model): a model to estimate outcomes and treatment effects
        """
        self.df = df
        self.inference_features = inference_features
        self.p_col = p_col
        self.treatment_col = treatment_col
        self.outcome_col = outcome_col
        self.learner = learner

    def get_prediction(self, X, p, treatment, y):
        """Return the treatment effects prediction.

        Args:
            X (np.matrix): a feature matrix
            p (np.array): a propensity score vector between 0 and 1
            treatment (np.array): a treatment vector (1 if treated, otherwise 0)
            y (np.array): an outcome vector

        Returns:
            (numpy.ndarray): Predictions of treatment effects
        """
        learner = self.learner
        try:
            preds = learner.fit_predict(X=X, p=p, treatment=treatment, y=y).flatten()
        except TypeError:
            # Learner does not accept a propensity-score argument; retry without it.
            preds = learner.fit_predict(X=X, treatment=treatment, y=y).flatten()
        return preds

    def get_ate_ci(self, X, p, treatment, y):
        """Return the confidence intervals for treatment effects prediction.

        Args:
            X (np.matrix): a feature matrix
            p (np.array): a propensity score vector between 0 and 1
            treatment (np.array): a treatment vector (1 if treated, otherwise 0)
            y (np.array): an outcome vector

        Returns:
            (numpy.ndarray): Mean and confidence interval (LB, UB) of the ATE estimate.
        """
        learner = self.learner
        # Imported lazily to avoid a circular import at module load time.
        from ..inference.meta.tlearner import BaseTLearner

        if isinstance(learner, BaseTLearner):
            ate, ate_lower, ate_upper = learner.estimate_ate(
                X=X, treatment=treatment, y=y
            )
        else:
            try:
                ate, ate_lower, ate_upper = learner.estimate_ate(
                    X=X, p=p, treatment=treatment, y=y
                )
            except TypeError:
                # Learner does not accept p; ask for CIs explicitly instead.
                ate, ate_lower, ate_upper = learner.estimate_ate(
                    X=X, treatment=treatment, y=y, return_ci=True
                )
        return ate[0], ate_lower[0], ate_upper[0]

    @staticmethod
    def get_class_object(method_name, *args, **kwargs):
        """Return class object based on input method

        Args:
            method_name (str): a sensitivity analysis method name

        Returns:
            (class): Sensitivity class

        Raises:
            AttributeError: if no class implements ``method_name``
        """
        method_list = [
            "Placebo Treatment",
            "Random Cause",
            "Subset Data",
            "Random Replace",
            "Selection Bias",
        ]
        class_name = "Sensitivity" + method_name.replace(" ", "")
        try:
            # Bug fix: the original resolved the attribute twice; one lookup suffices.
            return getattr(import_module("causalml.metrics.sensitivity"), class_name)
        except AttributeError:
            raise AttributeError(
                "{} is not an existing method for sensitiviy analysis.".format(
                    method_name
                )
                + " Select one of {}".format(method_list)
            )

    def sensitivity_analysis(
        self, methods, sample_size=None, confound="one_sided", alpha_range=None
    ):
        """Return the sensitivity data by different method

        Args:
            methods (list of str): a list of sensitivity analysis methods
            sample_size (float, optional): ratio for subset the original data
            confound (string, optional): the name of confounding function
            alpha_range (np.array, optional): a parameter to pass the confounding function

        Returns:
            (pd.DataFrame): one summary row per method with the ATE and the new
            ATE estimate with its bounds (columns ``SUMMARY_COLS``)
        """
        if alpha_range is None:
            # Default grid: 11 points spanning +/- half the outcome IQR,
            # always including zero so the unconfounded ATE is computed.
            y = self.df[self.outcome_col]
            iqr = y.quantile(0.75) - y.quantile(0.25)
            alpha_range = np.linspace(-iqr / 2, iqr / 2, 11)
            if 0 not in alpha_range:
                alpha_range = np.append(alpha_range, 0)
        alpha_range.sort()

        summary = []
        for method in methods:
            sens = self.get_class_object(method)
            sens = sens(
                self.df,
                self.inference_features,
                self.p_col,
                self.treatment_col,
                self.outcome_col,
                self.learner,
                sample_size=sample_size,
                confound=confound,
                alpha_range=alpha_range,
            )
            if method == "Subset Data":
                method = method + "(sample size @{})".format(sample_size)
            sens_df = sens.summary(method=method)
            summary.append(sens_df.values.tolist()[0])

        summary_df = pd.DataFrame(summary, columns=SUMMARY_COLS)
        return summary_df

    def summary(self, method):
        """Summary report

        Args:
            method (str): sensitivity analysis method

        Returns:
            (pd.DataFrame): a summary dataframe
        """
        method_name = method
        X = self.df[self.inference_features].values
        p = self.df[self.p_col].values
        treatment = self.df[self.treatment_col].values
        y = self.df[self.outcome_col].values

        preds = self.get_prediction(X, p, treatment, y)
        ate = preds.mean()
        ate_new, ate_new_lower, ate_new_upper = self.sensitivity_estimate()

        sensitivity_summary = pd.DataFrame(
            [method_name, ate, ate_new, ate_new_lower, ate_new_upper]
        ).T
        sensitivity_summary.columns = SUMMARY_COLS
        return sensitivity_summary

    def sensitivity_estimate(self):
        # Subclasses implement the actual refutation strategy.
        raise NotImplementedError
class SensitivityPlaceboTreatment(Sensitivity):
    """Replaces the treatment variable with a new variable randomly generated."""

    def __init__(self, *args, **kwargs):
        super().__init__(*args, **kwargs)

    def sensitivity_estimate(self):
        """Re-estimate the ATE after swapping the real treatment assignment
        for a random coin-flip placebo.

        Returns:
            (tuple): the new ATE estimate and its lower / upper confidence bounds
        """
        n = self.df.shape[0]
        features = self.df[self.inference_features].values
        propensity = self.df[self.p_col].values
        # A placebo treatment independent of the outcome by construction.
        placebo_treatment = np.random.randint(2, size=n)
        outcome = self.df[self.outcome_col].values

        return self.get_ate_ci(features, propensity, placebo_treatment, outcome)
class SensitivityRandomCause(Sensitivity):
    """Adds an irrelevant random covariate to the dataframe."""

    def __init__(self, *args, **kwargs):
        super().__init__(*args, **kwargs)

    def sensitivity_estimate(self):
        """Re-estimate the ATE after appending a pure-noise feature column.

        Returns:
            (tuple): the new ATE estimate and its lower / upper confidence bounds
        """
        noise = np.random.randn(self.df.shape[0]).reshape((-1, 1))
        features = self.df[self.inference_features].values
        propensity = self.df[self.p_col].values
        treatment = self.df[self.treatment_col].values
        outcome = self.df[self.outcome_col].values

        augmented = np.hstack((features, noise))
        return self.get_ate_ci(augmented, propensity, treatment, outcome)
class SensitivityRandomReplace(Sensitivity):
    """Replaces a random covariate with an irrelevant variable."""

    def __init__(self, *args, **kwargs):
        super().__init__(*args, **kwargs)
        if "replaced_feature" not in kwargs:
            # No feature specified: pick one uniformly at random.
            idx = np.random.randint(len(self.inference_features))
            self.replaced_feature = self.inference_features[idx]
        else:
            self.replaced_feature = kwargs["replaced_feature"]

    def sensitivity_estimate(self):
        """Re-estimate the ATE after overwriting the chosen covariate with noise."""
        logger.info(
            "Replace feature {} with an random irrelevant variable".format(
                self.replaced_feature
            )
        )

        replaced = self.df.copy()
        replaced[self.replaced_feature] = np.random.randn(self.df.shape[0])

        return self.get_ate_ci(
            replaced[self.inference_features].values,
            replaced[self.p_col].values,
            replaced[self.treatment_col].values,
            replaced[self.outcome_col].values,
        )
class SensitivitySubsetData(Sensitivity):
    """Takes a random subset of size sample_size of the data."""

    def __init__(self, *args, **kwargs):
        super().__init__(*args, **kwargs)
        self.sample_size = kwargs["sample_size"]
        assert self.sample_size is not None

    def sensitivity_estimate(self):
        """Re-estimate the ATE on a random fraction of the original rows.

        Returns:
            (tuple): the new ATE estimate and its lower / upper confidence bounds
        """
        subset = self.df.sample(frac=self.sample_size).copy()

        return self.get_ate_ci(
            subset[self.inference_features].values,
            subset[self.p_col].values,
            subset[self.treatment_col].values,
            subset[self.outcome_col].values,
        )
class SensitivitySelectionBias(Sensitivity):
    """Reference:

    [1] Blackwell, Matthew. "A selection bias approach to sensitivity analysis
    for causal effects." Political Analysis 22.2 (2014): 169-182.
    https://www.mattblackwell.org/files/papers/causalsens.pdf

    [2] Confouding parameter alpha_range using the same range as in:
    https://github.com/mattblackwell/causalsens/blob/master/R/causalsens.R
    """

    def __init__(
        self,
        *args,
        confound="one_sided",
        alpha_range=None,
        sensitivity_features=None,
        **kwargs,
    ):
        """Initialize.

        Args:
            confound (string): the name of confounding function
            alpha_range (np.array): a parameter to pass the confounding function
            sensitivity_features (list of str): a list of columns that to check each individual partial r-square

        Raises:
            NotImplementedError: if ``confound`` does not name a known confounding function
        """
        # Bug fix: the docstring above was originally placed after
        # super().__init__(), making it a dead string expression.
        super().__init__(*args, **kwargs)

        logger.info("Only works for linear outcome models right now. Check back soon.")

        confounding_functions = {
            "one_sided": one_sided,
            "alignment": alignment,
            "one_sided_att": one_sided_att,
            "alignment_att": alignment_att,
        }

        try:
            confound_func = confounding_functions[confound]
        except KeyError:
            # Bug fix: the original embedded a backslash line-continuation inside
            # the f-string, baking a run of indentation spaces into the message.
            raise NotImplementedError(
                f"Confounding function, {confound} is not implemented. "
                f"Use one of {confounding_functions.keys()}"
            )

        self.confound = confound_func

        if sensitivity_features is None:
            self.sensitivity_features = self.inference_features
        else:
            self.sensitivity_features = sensitivity_features

        if alpha_range is None:
            # Default grid mirrors the causalsens R package: 11 points spanning
            # +/- half the outcome IQR, always including zero.
            y = self.df[self.outcome_col]
            iqr = y.quantile(0.75) - y.quantile(0.25)
            self.alpha_range = np.linspace(-iqr / 2, iqr / 2, 11)
            if 0 not in self.alpha_range:
                self.alpha_range = np.append(self.alpha_range, 0)
        else:
            self.alpha_range = alpha_range

        self.alpha_range.sort()
[docs] def causalsens(self): alpha_range = self.alpha_range confound = self.confound df = self.df X = df[self.inference_features].values p = df[self.p_col].values treatment = df[self.treatment_col].values y = df[self.outcome_col].values preds = self.get_prediction(X, p, treatment, y) sens_df = pd.DataFrame() sens = [] for a in alpha_range: adj = confound(a, p, treatment) preds_adj = y - adj s_preds = self.get_prediction(X, p, treatment, preds_adj) ate, ate_lb, ate_ub = self.get_ate_ci(X, p, treatment, preds_adj) s_preds_residul = preds_adj - s_preds rsqs = a**2 * np.var(treatment) / np.var(s_preds_residul) sens.append([a, rsqs, ate, ate_lb, ate_ub]) sens_df = pd.DataFrame( sens, columns=["alpha", "rsqs", "New ATE", "New ATE LB", "New ATE UB"] ) rss = np.sum(np.square(y - preds)) partial_rsqs = [] for feature in self.sensitivity_features: df_new = df.copy() X_new = df_new[self.inference_features].drop(feature, axis=1).copy() y_new_preds = self.get_prediction(X_new, p, treatment, y) rss_new = np.sum(np.square(y - y_new_preds)) partial_rsqs.append(((rss_new - rss) / rss)) partial_rsqs_df = pd.DataFrame([self.sensitivity_features, partial_rsqs]).T partial_rsqs_df.columns = ["feature", "partial_rsqs"] return sens_df, partial_rsqs_df
[docs] def summary(self, method="Selection Bias"): """Summary report for Selection Bias Method Args: method_name (str): sensitivity analysis method Returns: (pd.DataFrame): a summary dataframe """ method_name = method sensitivity_summary = self.causalsens()[0] sensitivity_summary["Method"] = [ method_name + " (alpha@" + str(round(i, 5)) + ", with r-sqaure:" for i in sensitivity_summary.alpha ] sensitivity_summary["Method"] = sensitivity_summary[ "Method" ] + sensitivity_summary["rsqs"].round(5).astype(str) sensitivity_summary["ATE"] = sensitivity_summary[ sensitivity_summary.alpha == 0 ]["New ATE"] return sensitivity_summary[SUMMARY_COLS]
    @staticmethod
    def plot(sens_df, partial_rsqs_df=None, type="raw", ci=False, partial_rsqs=False):
        """Plot the results of a sensitivity analysis against unmeasured confounders.

        Args:
            sens_df (pandas.DataFrame): a data frame output from causalsens
            partial_rsqs_df (pandas.DataFrame): a data frame output from causalsens including partial rsquare
            type (str, optional): the type of plot to draw, 'raw' or 'r.squared' are supported
            ci (bool, optional): whether plot confidence intervals
            partial_rsqs (bool, optional): whether plot partial rsquare results

        NOTE(review): the ``type`` parameter shadows the builtin; any value
        other than 'raw' or 'r.squared' silently draws nothing.
        """
        if type == "raw" and not ci:
            fig, ax = plt.subplots()
            # Pad the axis limits slightly beyond the observed data range.
            y_max = round(sens_df["New ATE UB"].max() * 1.1, 4)
            y_min = round(sens_df["New ATE LB"].min() * 0.9, 4)
            x_max = round(sens_df.alpha.max() * 1.1, 4)
            x_min = round(sens_df.alpha.min() * 0.9, 4)
            plt.ylim(y_min, y_max)
            plt.xlim(x_min, x_max)
            ax.plot(sens_df.alpha, sens_df["New ATE"])
        elif type == "raw" and ci:
            fig, ax = plt.subplots()
            y_max = round(sens_df["New ATE UB"].max() * 1.1, 4)
            y_min = round(sens_df["New ATE LB"].min() * 0.9, 4)
            x_max = round(sens_df.alpha.max() * 1.1, 4)
            x_min = round(sens_df.alpha.min() * 0.9, 4)
            plt.ylim(y_min, y_max)
            plt.xlim(x_min, x_max)
            # Shade the confidence band behind the point-estimate line.
            ax.fill_between(
                sens_df.alpha,
                sens_df["New ATE LB"],
                sens_df["New ATE UB"],
                color="gray",
                alpha=0.5,
            )
            ax.plot(sens_df.alpha, sens_df["New ATE"])
        elif type == "r.squared" and ci:
            fig, ax = plt.subplots()
            y_max = round(sens_df["New ATE UB"].max() * 1.1, 4)
            y_min = round(sens_df["New ATE LB"].min() * 0.9, 4)
            plt.ylim(y_min, y_max)
            ax.fill_between(
                sens_df.rsqs,
                sens_df["New ATE LB"],
                sens_df["New ATE UB"],
                color="gray",
                alpha=0.5,
            )
            ax.plot(sens_df.rsqs, sens_df["New ATE"])
            if partial_rsqs:
                # Mark each feature's partial r-square at the alpha == 0 ATE level.
                plt.scatter(
                    partial_rsqs_df.partial_rsqs,
                    list(sens_df[sens_df.alpha == 0]["New ATE"])
                    * partial_rsqs_df.shape[0],
                    marker="x",
                    color="red",
                    linewidth=10,
                )
        elif type == "r.squared" and not ci:
            fig, ax = plt.subplots()
            y_max = round(sens_df["New ATE UB"].max() * 1.1, 4)
            y_min = round(sens_df["New ATE LB"].min() * 0.9, 4)
            plt.ylim(y_min, y_max)
            plt.plot(sens_df.rsqs, sens_df["New ATE"])
            if partial_rsqs:
                # Mark each feature's partial r-square at the alpha == 0 ATE level.
                plt.scatter(
                    partial_rsqs_df.partial_rsqs,
                    list(sens_df[sens_df.alpha == 0]["New ATE"])
                    * partial_rsqs_df.shape[0],
                    marker="x",
                    color="red",
                    linewidth=10,
                )
[docs] @staticmethod def partial_rsqs_confounding(sens_df, feature_name, partial_rsqs_value, range=0.01): """Check partial rsqs values of feature corresponding confounding amonunt of ATE Args: sens_df (pandas.DataFrame): a data frame output from causalsens feature_name (str): feature name to check partial_rsqs_value (float) : partial rsquare value of feature range (float) : range to search from sens_df Return: min and max value of confounding amount """ rsqs_dict = [] for i in sens_df.rsqs: if ( partial_rsqs_value - partial_rsqs_value * range < i < partial_rsqs_value + partial_rsqs_value * range ): rsqs_dict.append(i) if rsqs_dict: confounding_min = sens_df[sens_df.rsqs.isin(rsqs_dict)].alpha.min() confounding_max = sens_df[sens_df.rsqs.isin(rsqs_dict)].alpha.max() logger.info( "Only works for linear outcome models right now. Check back soon." ) logger.info( "For feature {} with partial rsquare {} confounding amount with possible values: {}, {}".format( feature_name, partial_rsqs_value, confounding_min, confounding_max ) ) return [confounding_min, confounding_max] else: logger.info( "Cannot find correponding rsquare value within the range for input, please edit confounding", "values vector or use a larger range and try again", )