import numpy as np
from econml.grf._base_grf import BaseGRF
from econml.sklearn_extensions.model_selection import GridSearchCVList
from econml.utilities import cross_product
from scipy import stats
from sklearn.compose import ColumnTransformer, make_column_selector
from sklearn.ensemble import (
GradientBoostingClassifier,
GradientBoostingRegressor,
RandomForestClassifier,
RandomForestRegressor,
)
from sklearn.linear_model import LogisticRegression
from sklearn.pipeline import Pipeline
from sklearn.preprocessing import StandardScaler
from dowhy.utils.regression import create_polynomial_function, generate_moment_function, get_generic_regressor
def get_alpha_estimator(
    cv, X, max_degree=None, estimator_list=None, estimator_param_list=None, numeric_features=None, plugin_reisz=True
):
    """Find the best estimator for the Reisz representer (alpha_s).

    :param cv: training and testing data indices obtained after K-folding the dataset
    :param X: array whose first column is the (binary) treatment and whose
        remaining columns are the confounders
    :param max_degree: degree of the polynomial function used to approximate alpha_s
    :param estimator_list: candidate estimators to search over; when
        ``estimator_param_list`` is None, a default list is used instead
    :param estimator_param_list: list of hyperparameter grids (one dict per
        candidate estimator) used to tune the alpha_s estimator
    :param numeric_features: indices of numeric columns (scaled in the
        logistic-regression pipeline)
    :param plugin_reisz: if True, estimate alpha_s via a plugin propensity
        model; otherwise fit a ReiszRepresenter forest directly
    :returns: estimator for alpha_s

    This method assumes a binary T stored in column 0 of X.
    """
    if plugin_reisz:
        # Plugin approach: for ATE, alpha_s is a deterministic function of the
        # propensity score, so it suffices to fit a good classifier P(T=1|W).
        if estimator_param_list is None:
            # Defaults for both lists are installed together so the two stay aligned.
            estimator_list = [
                RandomForestClassifier(n_estimators=100, random_state=120),
                Pipeline(
                    [
                        (
                            "scale",
                            ColumnTransformer([("num", StandardScaler(), numeric_features)], remainder="passthrough"),
                        ),
                        ("logistic_model", LogisticRegression()),
                    ]
                ),
                GradientBoostingClassifier(),
            ]
            estimator_param_list = [
                {"n_estimators": [50], "max_depth": [3, 4, 5], "min_samples_leaf": [10, 50]},
                {"logistic_model__C": [1, 0.01, 0.001, 1e-4, 1e-5]},
                {"learning_rate": [0.01, 0.001], "n_estimators": [50, 200]},
            ]
        W = X[:, 1:]  # assume 1-D treatment in column 0
        t = X[:, 0]
        propmodel = get_generic_regressor(
            cv=cv,
            X=W,
            Y=t,
            max_degree=max_degree,
            estimator_list=estimator_list,
            estimator_param_list=estimator_param_list,
            numeric_features=numeric_features,
        )
        reisz_fn = PluginReisz(propmodel)
    else:
        # Direct approach: tune a ReiszRepresenter forest using the
        # model-free Reisz loss (reisz_scoring).
        if estimator_param_list is None:
            estimator_param_list = [
                {
                    "reisz_functions": [create_polynomial_function(2), create_polynomial_function(1)],
                    "min_samples_leaf": [10, 50],
                    "min_var_fraction_leaf": [0.01, 0.1],
                    "l2_regularizer": [1e-5, 1e-3],
                    "max_depth": [5, None],
                }
            ]
        estimator = GridSearchCVList(
            [
                ReiszRepresenter(
                    reisz_functions=create_polynomial_function(max_degree),
                    moment_function=generate_moment_function,
                    min_samples_leaf=10,
                    min_var_fraction_leaf=0.01,
                    max_depth=5,
                )
            ],
            param_grid_list=estimator_param_list,
            scoring=reisz_scoring,
            cv=cv,
            verbose=0,
            n_jobs=-1,
        ).fit(X)
        reisz_fn = estimator.best_estimator_
    return reisz_fn
class PluginReisz:
    """Plugin Reisz function for the average treatment effect.

    Wraps a propensity model for P(T=1|W); `predict` returns the signed
    inverse-propensity weight 1/p(W) for treated rows and -1/(1-p(W)) for
    control rows, which is the plugin Reisz representer for the ATE moment.
    """

    def __init__(self, propensity_model):
        # Any classifier exposing fit(W, t) and predict_proba(W).
        self.propmodel = propensity_model

    def fit(self, X):
        """Fit the propensity model.

        :param X: array whose column 0 is the (binary) treatment and whose
            remaining columns are the confounders W.
        :returns: self
        """
        W = X[:, 1:]  # assume 1-D treatment in column 0
        t = X[:, 0]
        self.propmodel.fit(W, t)
        return self

    def predict(self, X):
        """Return signed inverse-propensity weights, one per row of X."""
        W = X[:, 1:]  # assume 1-D treatment in column 0
        t = X[:, 0]
        preds = self.propmodel.predict_proba(W)
        # Probability of the treatment level actually received, per row
        # (vectorized replacement of the per-row Python loop: preds[i, t[i]]).
        received = preds[np.arange(preds.shape[0]), t.astype(int)]
        # Negative sign for control units, positive for treated units.
        return np.where(t == 0, -1, 1) / received

    def propensity(self, X):
        """
        P(T=1|W)
        """
        W = X[:, 1:]  # assume 1-D treatment in column 0
        return self.propmodel.predict_proba(W)[:, 1]
def reisz_scoring(g, X):
    """Return the Reisz loss for an estimator model.

    Loss(g) = E[2*m(X,g) - g(X)**2]

    :param g: model to be evaluated (must expose a ``predict`` method)
    :param X: data for testing the model
    :returns: floating point number that quantifies the model prediction
    """
    moment_term = generate_moment_function(W=X, g=g.predict)
    squared_preds = np.square(g.predict(X))
    return np.mean(2 * moment_term - squared_preds)
class ReiszRepresenter(BaseGRF):
    """
    Generalized Random Forest to estimate Reisz Representer (RR)
    See: https://github.com/microsoft/EconML/blob/main/econml/grf/_base_grf.py
    :param reisz_functions: List of polynomial functions of n degree to approximate reisz representer created using create_polynomial_function
    :param moment_function: moment function m(W,g) whose expected value is used to calculate estimate
    :param l2_regularizer: l2 penalty while modeling (default = 1e-3)
    For tuning other parameters see https://econml.azurewebsites.net/_autosummary/econml.grf.CausalForest.html
    """

    def __init__(
        self,
        *,
        reisz_functions,
        moment_function=generate_moment_function,
        l2_regularizer=1e-3,
        n_estimators=100,
        criterion="mse",
        max_depth=None,
        min_samples_split=10,
        min_samples_leaf=5,
        min_weight_fraction_leaf=0.0,
        min_var_fraction_leaf=None,
        min_var_leaf_on_val=False,
        max_features="auto",
        min_impurity_decrease=0.0,
        max_samples=0.45,
        min_balancedness_tol=0.45,
        honest=True,
        inference=True,
        fit_intercept=True,
        subforest_size=4,
        n_jobs=-1,
        random_state=None,
        verbose=0,
        warm_start=False,
    ):
        # Reisz-specific state kept on self; everything else is forwarded to BaseGRF.
        self.reisz_functions = reisz_functions
        self.moment_function = moment_function
        self.l2_regularizer = l2_regularizer
        self.num_reisz_functions = len(self.reisz_functions)
        super().__init__(
            n_estimators=n_estimators,
            criterion=criterion,
            max_depth=max_depth,
            min_samples_split=min_samples_split,
            min_samples_leaf=min_samples_leaf,
            min_weight_fraction_leaf=min_weight_fraction_leaf,
            min_var_fraction_leaf=min_var_fraction_leaf,
            min_var_leaf_on_val=min_var_leaf_on_val,
            max_features=max_features,
            min_impurity_decrease=min_impurity_decrease,
            max_samples=max_samples,
            min_balancedness_tol=min_balancedness_tol,
            honest=honest,
            inference=inference,
            # NOTE(review): the `fit_intercept` constructor argument is accepted but
            # ignored here — False is hard-coded. Confirm this is intentional.
            fit_intercept=False,
            subforest_size=subforest_size,
            n_jobs=n_jobs,
            random_state=random_state,
            verbose=verbose,
            warm_start=warm_start,
        )

    def _get_alpha_and_pointJ(self, X, T, y):
        # BaseGRF override: builds the per-sample linear moment pieces.
        # alpha holds m(TX, f_k) for each reisz basis function f_k; pointJ is
        # the per-sample (flattened) outer-product matrix of the basis features
        # plus an l2 ridge term.
        n_riesz_feats = len(self.reisz_functions)
        # Reassemble [treatment | confounders] since BaseGRF passes them split.
        TX = np.hstack([T, X])
        riesz_feats = np.hstack([feat_fn(TX) for feat_fn in self.reisz_functions])
        mfeats = np.hstack([self.moment_function(TX, feat_fn) for feat_fn in self.reisz_functions])
        alpha = np.zeros((X.shape[0], n_riesz_feats))
        alpha[:, :n_riesz_feats] = mfeats
        # Per-sample (n_feats x n_feats) covariance of the basis features.
        riesz_cov_matrix = cross_product(riesz_feats, riesz_feats).reshape((X.shape[0], n_riesz_feats, n_riesz_feats))
        penalty = self.l2_regularizer * np.eye(n_riesz_feats)
        # First basis function is left unpenalized — presumably the constant/
        # intercept term of the polynomial basis (TODO confirm).
        penalty[0, 0] = 0
        pointJ = riesz_cov_matrix + penalty
        return alpha, pointJ.reshape((X.shape[0], -1))

    def _get_n_outputs_decomposition(self, X, T, y):
        # BaseGRF override: one output per reisz basis function, all relevant.
        n_relevant_outputs = len(self.reisz_functions)
        n_outputs = n_relevant_outputs
        return n_outputs, n_relevant_outputs

    def _translate(self, point, TX):
        # Combine the forest's local coefficients with the basis features
        # evaluated at TX to produce the reisz representer value per sample.
        riesz_feats = np.hstack([feat_fn(TX) for feat_fn in self.reisz_functions])
        n_riesz_feats = riesz_feats.shape[1]
        riesz = np.sum(point[:, :n_riesz_feats] * riesz_feats, axis=1)
        return riesz

    def fit(self, X):
        # Column 0 is the treatment; it is passed as both T and y because
        # BaseGRF requires a y argument but the reisz loss does not use one.
        return super().fit(X[:, 1:], X[:, [0]], X[:, [0]])

    def predict(self, X_test):
        # Predict local coefficients from the confounders, then evaluate the
        # basis expansion on the full [treatment | confounders] matrix.
        point = super().predict(X_test[:, 1:])
        return self._translate(point, X_test)