From 06f85feeb730aa36532bf0791529ecf49f316372 Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Fri, 22 Sep 2023 12:28:25 -0400 Subject: [PATCH 01/25] initial commit for binary outcome, warn when clf passed but disc_treat=False Signed-off-by: Fabio Vera --- econml/_ortho_learner.py | 56 +++++++++++++++++++++-------- econml/dml/_rlearner.py | 5 +-- econml/dml/causal_forest.py | 6 +++- econml/dml/dml.py | 44 ++++++++++++++++++----- econml/iv/dml/_dml.py | 58 ++++++++++++++++++++---------- econml/iv/dr/_dr.py | 55 ++++++++++++++++++++-------- econml/panel/dml/_dml.py | 14 +++++--- econml/tests/test_ortho_learner.py | 18 +++++----- 8 files changed, 184 insertions(+), 72 deletions(-) diff --git a/econml/_ortho_learner.py b/econml/_ortho_learner.py index becff2499..498376f1d 100644 --- a/econml/_ortho_learner.py +++ b/econml/_ortho_learner.py @@ -432,10 +432,17 @@ def _gen_ortho_learner_model_final(self): """ def __init__(self, *, - discrete_treatment, treatment_featurizer, - discrete_instrument, categories, cv, random_state, - mc_iters=None, mc_agg='mean'): + binary_outcome, + discrete_treatment, + treatment_featurizer, + discrete_instrument, + categories, + cv, + random_state, + mc_iters=None, + mc_agg='mean'): self.cv = cv + self.binary_outcome = binary_outcome self.discrete_treatment = discrete_treatment self.treatment_featurizer = treatment_featurizer self.discrete_instrument = discrete_instrument @@ -525,21 +532,42 @@ def _subinds_check_none(self, var, inds): def _strata(self, Y, T, X=None, W=None, Z=None, sample_weight=None, freq_weight=None, sample_var=None, groups=None, cache_values=False, only_final=False, check_input=True): + arrs = [] + if self.binary_outcome: + arrs.append(Y) + if self.discrete_treatment: + arrs.append(T) if self.discrete_instrument: - Z = LabelEncoder().fit_transform(np.ravel(Z)) + arrs.append(Z) - if self.discrete_treatment: - enc = LabelEncoder() - T = enc.fit_transform(np.ravel(T)) - if self.discrete_instrument: - return T + Z * 
len(enc.classes_) - else: - return T - elif self.discrete_instrument: - return Z - else: + return self._single_strata_from_discrete_arrays(arrs) + + """ + Combine multiple discrete arrays into a single array for stratification purposes: + + e.g. if arrs are + [0 1 2 0 1 2 0 1 2 0 1 2], + [0 1 0 1 0 1 0 1 0 1 0 1], + [0 0 0 0 0 0 1 1 1 1 1 1] + then output will be + [0 6 8 2 4 10 1 7 9 3 5 11] + + Every distinct combination of these discrete arrays will have its own label. + """ + + def _single_strata_from_discrete_arrays(self, arrs): + if not arrs: return None + curr_array = np.zeros(shape=arrs[0].ravel().shape, dtype='int') + + for arr in arrs: + enc = LabelEncoder() + temp = enc.fit_transform(arr.ravel()) + curr_array = temp + curr_array * len(enc.classes_) + + return curr_array + def _prefit(self, Y, T, *args, only_final=False, **kwargs): # generate an instance of the final model diff --git a/econml/dml/_rlearner.py b/econml/dml/_rlearner.py index d13b99a2f..f5362f288 100644 --- a/econml/dml/_rlearner.py +++ b/econml/dml/_rlearner.py @@ -271,9 +271,10 @@ def _gen_rlearner_model_final(self): is multidimensional, then the average of the MSEs for each dimension of Y is returned. 
""" - def __init__(self, *, discrete_treatment, treatment_featurizer, categories, + def __init__(self, *, binary_outcome, discrete_treatment, treatment_featurizer, categories, cv, random_state, mc_iters=None, mc_agg='mean'): - super().__init__(discrete_treatment=discrete_treatment, + super().__init__(binary_outcome=binary_outcome, + discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, discrete_instrument=False, # no instrument, so doesn't matter categories=categories, diff --git a/econml/dml/causal_forest.py b/econml/dml/causal_forest.py index 07a356d75..8faf157c2 100644 --- a/econml/dml/causal_forest.py +++ b/econml/dml/causal_forest.py @@ -649,7 +649,11 @@ def _gen_featurizer(self): def _gen_model_y(self): if self.model_y == 'auto': - model_y = WeightedLassoCVWrapper(random_state=self.random_state) + if self.binary_outcome: + model_y = LogisticRegressionCV(cv=WeightedStratifiedKFold(random_state=self.random_state), + random_state=self.random_state) + else: + model_y = WeightedLassoCVWrapper(random_state=self.random_state) else: model_y = clone(self.model_y, safe=False) return _FirstStageWrapper(model_y, True, self._gen_featurizer(), False, self.discrete_treatment) diff --git a/econml/dml/dml.py b/econml/dml/dml.py index 713554dad..286702a16 100644 --- a/econml/dml/dml.py +++ b/econml/dml/dml.py @@ -37,12 +37,20 @@ class _FirstStageWrapper: - def __init__(self, model, is_Y, featurizer, linear_first_stages, discrete_treatment): + def __init__( + self, + model, + is_Y, + featurizer, + linear_first_stages, + discrete_treatment, + binary_outcome): self._model = clone(model, safe=False) self._featurizer = clone(featurizer, safe=False) self._is_Y = is_Y self._linear_first_stages = linear_first_stages self._discrete_treatment = discrete_treatment + self._binary_outcome = binary_outcome def _combine(self, X, W, n_samples, fitting=True): if X is None: @@ -77,9 +85,13 @@ def fit(self, X, W, Target, sample_weight=None, groups=None): def 
predict(self, X, W): n_samples = X.shape[0] if X is not None else (W.shape[0] if W is not None else 1) - if (not self._is_Y) and self._discrete_treatment: + if (not self._is_Y and self._discrete_treatment) or (self._is_Y and self._binary_outcome): return self._model.predict_proba(self._combine(X, W, n_samples, fitting=False))[:, 1:] else: + if (not self._is_Y) and (not self._discrete_treatment) and hasattr(self._model, 'predict_proba'): + warn("A treatment model has a predict_proba method, but discrete_treatment=False. " + "If your treatment is discrete, consider setting discrete_treatment=True. " + "Otherwise, if your treatment is not discrete, use a regressor instead.", UserWarning) return self._model.predict(self._combine(X, W, n_samples, fitting=False)) def score(self, X, W, Target, sample_weight=None): @@ -461,6 +473,7 @@ def __init__(self, *, treatment_featurizer=None, fit_cate_intercept=True, linear_first_stages=False, + binary_outcome=False, discrete_treatment=False, categories='auto', cv=2, @@ -475,7 +488,8 @@ def __init__(self, *, self.model_y = clone(model_y, safe=False) self.model_t = clone(model_t, safe=False) self.model_final = clone(model_final, safe=False) - super().__init__(discrete_treatment=discrete_treatment, + super().__init__(binary_outcome=binary_outcome, + discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, categories=categories, cv=cv, @@ -488,11 +502,15 @@ def _gen_featurizer(self): def _gen_model_y(self): if self.model_y == 'auto': - model_y = WeightedLassoCVWrapper(random_state=self.random_state) + if self.binary_outcome: + model_y = LogisticRegressionCV(cv=WeightedStratifiedKFold(random_state=self.random_state), + random_state=self.random_state) + else: + model_y = WeightedLassoCVWrapper(random_state=self.random_state) else: model_y = clone(self.model_y, safe=False) return _FirstStageWrapper(model_y, True, self._gen_featurizer(), - self.linear_first_stages, self.discrete_treatment) + 
self.linear_first_stages, self.discrete_treatment, self.binary_outcome) def _gen_model_t(self): if self.model_t == 'auto': @@ -504,7 +522,7 @@ def _gen_model_t(self): else: model_t = clone(self.model_t, safe=False) return _FirstStageWrapper(model_t, False, self._gen_featurizer(), - self.linear_first_stages, self.discrete_treatment) + self.linear_first_stages, self.discrete_treatment, self.binary_outcome) def _gen_model_final(self): return clone(self.model_final, safe=False) @@ -687,6 +705,7 @@ def __init__(self, *, treatment_featurizer=None, fit_cate_intercept=True, linear_first_stages=True, + binary_outcome=False, discrete_treatment=False, categories='auto', cv=2, @@ -700,6 +719,7 @@ def __init__(self, *, treatment_featurizer=treatment_featurizer, fit_cate_intercept=fit_cate_intercept, linear_first_stages=linear_first_stages, + binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, categories=categories, cv=cv, @@ -927,6 +947,7 @@ def __init__(self, *, treatment_featurizer=None, fit_cate_intercept=True, linear_first_stages=True, + binary_outcome=False, discrete_treatment=False, categories='auto', cv=2, @@ -947,6 +968,7 @@ def __init__(self, *, treatment_featurizer=treatment_featurizer, fit_cate_intercept=fit_cate_intercept, linear_first_stages=linear_first_stages, + binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, categories=categories, cv=cv, @@ -1131,6 +1153,7 @@ class KernelDML(DML): """ def __init__(self, model_y='auto', model_t='auto', + binary_outcome=False, discrete_treatment=False, treatment_featurizer=None, categories='auto', @@ -1148,6 +1171,7 @@ def __init__(self, model_y='auto', model_t='auto', featurizer=None, treatment_featurizer=treatment_featurizer, fit_cate_intercept=fit_cate_intercept, + binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, categories=categories, cv=cv, @@ -1320,6 +1344,7 @@ class NonParamDML(_BaseDML): def __init__(self, *, model_y, model_t, model_final, featurizer=None, + 
binary_outcome=False, discrete_treatment=False, treatment_featurizer=None, categories='auto', @@ -1334,7 +1359,8 @@ def __init__(self, *, self.model_t = clone(model_t, safe=False) self.featurizer = clone(featurizer, safe=False) self.model_final = clone(model_final, safe=False) - super().__init__(discrete_treatment=discrete_treatment, + super().__init__(binary_outcome=binary_outcome, + discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, categories=categories, cv=cv, @@ -1353,11 +1379,11 @@ def _gen_featurizer(self): def _gen_model_y(self): return _FirstStageWrapper(clone(self.model_y, safe=False), True, - self._gen_featurizer(), False, self.discrete_treatment) + self._gen_featurizer(), False, self.discrete_treatment, self.binary_outcome) def _gen_model_t(self): return _FirstStageWrapper(clone(self.model_t, safe=False), False, - self._gen_featurizer(), False, self.discrete_treatment) + self._gen_featurizer(), False, self.discrete_treatment, self.binary_outcome) def _gen_model_final(self): return clone(self.model_final, safe=False) diff --git a/econml/iv/dml/_dml.py b/econml/iv/dml/_dml.py index af0134ba3..f8b6c3df4 100644 --- a/econml/iv/dml/_dml.py +++ b/econml/iv/dml/_dml.py @@ -343,6 +343,7 @@ def __init__(self, *, projection=False, featurizer=None, fit_cate_intercept=True, + binary_outcome=False, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, @@ -359,7 +360,8 @@ def __init__(self, *, self.featurizer = clone(featurizer, safe=False) self.fit_cate_intercept = fit_cate_intercept - super().__init__(discrete_instrument=discrete_instrument, + super().__init__(binary_outcome=binary_outcome, + discrete_instrument=discrete_instrument, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, categories=categories, @@ -379,7 +381,11 @@ def _gen_ortho_learner_model_final(self): def _gen_ortho_learner_model_nuisance(self): if self.model_y_xw == 'auto': - model_y_xw = 
WeightedLassoCVWrapper(random_state=self.random_state) + if self.binary_outcome: + model_y_xw = LogisticRegressionCV(cv=WeightedStratifiedKFold(random_state=self.random_state), + random_state=self.random_state) + else: + model_y_xw = WeightedLassoCVWrapper(random_state=self.random_state) else: model_y_xw = clone(self.model_y_xw, safe=False) @@ -404,11 +410,13 @@ def _gen_ortho_learner_model_nuisance(self): model_t_xwz = clone(self.model_t_xwz, safe=False) return _OrthoIVModelNuisance(_FirstStageWrapper(clone(model_y_xw, safe=False), True, - self._gen_featurizer(), False, False), + self._gen_featurizer(), False, False, self.binary_outcome), _FirstStageWrapper(clone(model_t_xw, safe=False), False, - self._gen_featurizer(), False, self.discrete_treatment), + self._gen_featurizer(), False, + self.discrete_treatment, self.binary_outcome), _FirstStageWrapper(clone(model_t_xwz, safe=False), False, - self._gen_featurizer(), False, self.discrete_treatment), + self._gen_featurizer(), False, + self.discrete_treatment, self.binary_outcome), self.projection) else: @@ -423,11 +431,13 @@ def _gen_ortho_learner_model_nuisance(self): model_z_xw = clone(self.model_z_xw, safe=False) return _OrthoIVModelNuisance(_FirstStageWrapper(clone(model_y_xw, safe=False), True, - self._gen_featurizer(), False, False), + self._gen_featurizer(), False, False, self.binary_outcome), _FirstStageWrapper(clone(model_t_xw, safe=False), False, - self._gen_featurizer(), False, self.discrete_treatment), + self._gen_featurizer(), False, + self.discrete_treatment, self.binary_outcome), _FirstStageWrapper(clone(model_z_xw, safe=False), False, - self._gen_featurizer(), False, self.discrete_instrument), + self._gen_featurizer(), False, + self.discrete_instrument, self.binary_outcome), self.projection) def fit(self, Y, T, *, Z, X=None, W=None, sample_weight=None, freq_weight=None, sample_var=None, groups=None, @@ -1142,6 +1152,7 @@ def __init__(self, *, 
model_final=StatsModelsLinearRegression(fit_intercept=False), featurizer=None, fit_cate_intercept=True, + binary_outcome=False, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, @@ -1156,7 +1167,8 @@ def __init__(self, *, self.model_final = clone(model_final, safe=False) self.featurizer = clone(featurizer, safe=False) self.fit_cate_intercept = fit_cate_intercept - super().__init__(discrete_treatment=discrete_treatment, + super().__init__(binary_outcome=binary_outcome, + discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, discrete_instrument=discrete_instrument, categories=categories, @@ -1170,11 +1182,15 @@ def _gen_featurizer(self): def _gen_model_y_xw(self): if self.model_y_xw == 'auto': - model_y_xw = WeightedLassoCVWrapper(random_state=self.random_state) + if self.binary_outcome: + model_y_xw = LogisticRegressionCV(cv=WeightedStratifiedKFold(random_state=self.random_state), + random_state=self.random_state) + else: + model_y_xw = WeightedLassoCVWrapper(random_state=self.random_state) else: model_y_xw = clone(self.model_y_xw, safe=False) return _FirstStageWrapper(model_y_xw, True, self._gen_featurizer(), - False, False) + False, False, self.binary_outcome) def _gen_model_t_xw(self): if self.model_t_xw == 'auto': @@ -1186,7 +1202,7 @@ def _gen_model_t_xw(self): else: model_t_xw = clone(self.model_t_xw, safe=False) return _FirstStageWrapper(model_t_xw, False, self._gen_featurizer(), - False, self.discrete_treatment) + False, self.discrete_treatment, self.binary_outcome) def _gen_model_t_xwz(self): if self.model_t_xwz == 'auto': @@ -1198,7 +1214,7 @@ def _gen_model_t_xwz(self): else: model_t_xwz = clone(self.model_t_xwz, safe=False) return _FirstStageWrapper(model_t_xwz, False, self._gen_featurizer(), - False, self.discrete_treatment) + False, self.discrete_treatment, self.binary_outcome) def _gen_model_final(self): return clone(self.model_final, safe=False) @@ -1532,6 +1548,7 @@ def __init__(self, *, 
model_t_xw="auto", model_t_xwz="auto", model_final, + binary_outcome=False, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, @@ -1546,7 +1563,8 @@ def __init__(self, *, self.model_t_xwz = clone(model_t_xwz, safe=False) self.model_final = clone(model_final, safe=False) self.featurizer = clone(featurizer, safe=False) - super().__init__(discrete_treatment=discrete_treatment, + super().__init__(binary_outcome=binary_outcome, + discrete_treatment=discrete_treatment, discrete_instrument=discrete_instrument, treatment_featurizer=treatment_featurizer, categories=categories, @@ -1560,11 +1578,15 @@ def _gen_featurizer(self): def _gen_model_y_xw(self): if self.model_y_xw == 'auto': - model_y_xw = WeightedLassoCVWrapper(random_state=self.random_state) + if self.binary_outcome: + model_y_xw = LogisticRegressionCV(cv=WeightedStratifiedKFold(random_state=self.random_state), + random_state=self.random_state) + else: + model_y_xw = WeightedLassoCVWrapper(random_state=self.random_state) else: model_y_xw = clone(self.model_y_xw, safe=False) return _FirstStageWrapper(model_y_xw, True, self._gen_featurizer(), - False, False) + False, False, self.binary_outcome) def _gen_model_t_xw(self): if self.model_t_xw == 'auto': @@ -1576,7 +1598,7 @@ def _gen_model_t_xw(self): else: model_t_xw = clone(self.model_t_xw, safe=False) return _FirstStageWrapper(model_t_xw, False, self._gen_featurizer(), - False, self.discrete_treatment) + False, self.discrete_treatment, self.binary_outcome) def _gen_model_t_xwz(self): if self.model_t_xwz == 'auto': @@ -1588,7 +1610,7 @@ def _gen_model_t_xwz(self): else: model_t_xwz = clone(self.model_t_xwz, safe=False) return _FirstStageWrapper(model_t_xwz, False, self._gen_featurizer(), - False, self.discrete_treatment) + False, self.discrete_treatment, self.binary_outcome) def _gen_model_final(self): return clone(self.model_final, safe=False) diff --git a/econml/iv/dr/_dr.py b/econml/iv/dr/_dr.py index 6e3689453..b704e828c 100644 --- 
a/econml/iv/dr/_dr.py +++ b/econml/iv/dr/_dr.py @@ -301,6 +301,7 @@ def __init__(self, *, fit_cate_intercept=False, cov_clip=1e-3, opt_reweighted=False, + binary_outcome=False, discrete_instrument=False, discrete_treatment=False, treatment_featurizer=None, @@ -314,7 +315,8 @@ def __init__(self, *, self.fit_cate_intercept = fit_cate_intercept self.cov_clip = cov_clip self.opt_reweighted = opt_reweighted - super().__init__(discrete_instrument=discrete_instrument, + super().__init__(binary_outcome=binary_outcome, + discrete_instrument=discrete_instrument, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, categories=categories, @@ -550,6 +552,7 @@ def __init__(self, *, fit_cate_intercept=False, cov_clip=1e-3, opt_reweighted=False, + binary_outcome=False, discrete_instrument=False, discrete_treatment=False, treatment_featurizer=None, @@ -570,6 +573,7 @@ def __init__(self, *, fit_cate_intercept=fit_cate_intercept, cov_clip=cov_clip, opt_reweighted=opt_reweighted, + binary_outcome=binary_outcome, discrete_instrument=discrete_instrument, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, @@ -584,7 +588,11 @@ def _gen_prel_model_effect(self): def _gen_ortho_learner_model_nuisance(self): if self.model_y_xw == 'auto': - model_y_xw = WeightedLassoCVWrapper(random_state=self.random_state) + if self.binary_outcome: + model_y_xw = LogisticRegressionCV(cv=WeightedStratifiedKFold(random_state=self.random_state), + random_state=self.random_state) + else: + model_y_xw = WeightedLassoCVWrapper(random_state=self.random_state) else: model_y_xw = clone(self.model_y_xw, safe=False) @@ -614,14 +622,15 @@ def _gen_ortho_learner_model_nuisance(self): model_t_xwz = clone(self.model_t_xwz, safe=False) return _BaseDRIVModelNuisance(self._gen_prel_model_effect(), - _FirstStageWrapper(model_y_xw, True, self._gen_featurizer(), False, False), + _FirstStageWrapper(model_y_xw, True, self._gen_featurizer(), + False, False, 
self.binary_outcome), _FirstStageWrapper(model_t_xw, False, self._gen_featurizer(), - False, self.discrete_treatment), - # outcome is continuous since proj_t is probability + False, self.discrete_treatment, self.binary_outcome), + # target is continuous since proj_t is probability _FirstStageWrapper(model_tz_xw, False, self._gen_featurizer(), False, - False), + False, self.binary_outcome), _FirstStageWrapper(model_t_xwz, False, self._gen_featurizer(), - False, self.discrete_treatment), + False, self.discrete_treatment, self.binary_outcome), self.projection, self.discrete_treatment, self.discrete_instrument) else: @@ -644,13 +653,15 @@ def _gen_ortho_learner_model_nuisance(self): model_z_xw = clone(self.model_z_xw, safe=False) return _BaseDRIVModelNuisance(self._gen_prel_model_effect(), - _FirstStageWrapper(model_y_xw, True, self._gen_featurizer(), False, False), + _FirstStageWrapper(model_y_xw, True, self._gen_featurizer(), False, False, + self.binary_outcome), _FirstStageWrapper(model_t_xw, False, self._gen_featurizer(), - False, self.discrete_treatment), + False, self.discrete_treatment, self.binary_outcome), _FirstStageWrapper(model_tz_xw, False, self._gen_featurizer(), False, - self.discrete_treatment and self.discrete_instrument), + self.discrete_treatment and self.discrete_instrument, + self.binary_outcome), _FirstStageWrapper(model_z_xw, False, self._gen_featurizer(), - False, self.discrete_instrument), + False, self.discrete_instrument, self.binary_outcome), self.projection, self.discrete_treatment, self.discrete_instrument) @@ -838,6 +849,7 @@ def __init__(self, *, fit_cate_intercept=False, cov_clip=1e-3, opt_reweighted=False, + binary_outcome=False, discrete_instrument=False, discrete_treatment=False, treatment_featurizer=None, @@ -866,6 +878,7 @@ def __init__(self, *, fit_cate_intercept=fit_cate_intercept, cov_clip=cov_clip, opt_reweighted=opt_reweighted, + binary_outcome=binary_outcome, discrete_instrument=discrete_instrument, 
discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, @@ -1301,6 +1314,7 @@ def __init__(self, *, fit_cate_intercept=True, cov_clip=1e-3, opt_reweighted=False, + binary_outcome=False, discrete_instrument=False, discrete_treatment=False, treatment_featurizer=None, @@ -1324,6 +1338,7 @@ def __init__(self, *, fit_cate_intercept=fit_cate_intercept, cov_clip=cov_clip, opt_reweighted=opt_reweighted, + binary_outcome=binary_outcome, discrete_instrument=discrete_instrument, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, @@ -1632,6 +1647,7 @@ def __init__(self, *, n_jobs=None, cov_clip=1e-3, opt_reweighted=False, + binary_outcome=False, discrete_instrument=False, discrete_treatment=False, treatment_featurizer=None, @@ -1662,6 +1678,7 @@ def __init__(self, *, fit_cate_intercept=fit_cate_intercept, cov_clip=cov_clip, opt_reweighted=opt_reweighted, + binary_outcome=binary_outcome, discrete_instrument=discrete_instrument, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, @@ -2040,6 +2057,7 @@ def __init__(self, *, verbose=0, cov_clip=1e-3, opt_reweighted=False, + binary_outcome=False, discrete_instrument=False, discrete_treatment=False, treatment_featurizer=None, @@ -2076,6 +2094,7 @@ def __init__(self, *, fit_cate_intercept=False, cov_clip=cov_clip, opt_reweighted=opt_reweighted, + binary_outcome=binary_outcome, discrete_instrument=discrete_instrument, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, @@ -2294,7 +2313,11 @@ def _gen_prel_model_effect(self): def _gen_ortho_learner_model_nuisance(self): if self.model_y_xw == 'auto': - model_y_xw = WeightedLassoCVWrapper(random_state=self.random_state) + if self.binary_outcome: + model_y_xw = LogisticRegressionCV(cv=WeightedStratifiedKFold(random_state=self.random_state), + random_state=self.random_state) + else: + model_y_xw = WeightedLassoCVWrapper(random_state=self.random_state) else: model_y_xw = 
clone(self.model_y_xw, safe=False) @@ -2312,11 +2335,13 @@ def _gen_ortho_learner_model_nuisance(self): raise ValueError("Only 'auto' or float is allowed!") return _IntentToTreatDRIVModelNuisance(_FirstStageWrapper(model_y_xw, True, self._gen_featurizer(), - False, False), + False, False, self.binary_outcome), _FirstStageWrapper(model_t_xwz, False, - self._gen_featurizer(), False, True), + self._gen_featurizer(), False, True, + self.binary_outcome), _FirstStageWrapper(dummy_z, False, - self._gen_featurizer(), False, True), + self._gen_featurizer(), False, True, + self.binary_outcome), self._gen_prel_model_effect() ) diff --git a/econml/panel/dml/_dml.py b/econml/panel/dml/_dml.py index a12385e36..2dde6dbe0 100644 --- a/econml/panel/dml/_dml.py +++ b/econml/panel/dml/_dml.py @@ -458,6 +458,7 @@ def __init__(self, *, featurizer=None, fit_cate_intercept=True, linear_first_stages=False, + binary_outcome=False, discrete_treatment=False, categories='auto', cv=2, @@ -469,7 +470,8 @@ def __init__(self, *, self.featurizer = clone(featurizer, safe=False) self.model_y = clone(model_y, safe=False) self.model_t = clone(model_t, safe=False) - super().__init__(discrete_treatment=discrete_treatment, + super().__init__(binary_outcome=binary_outcome, + discrete_treatment=discrete_treatment, treatment_featurizer=None, discrete_instrument=False, categories=categories, @@ -526,11 +528,15 @@ def _gen_featurizer(self): def _gen_model_y(self): if self.model_y == 'auto': - model_y = WeightedLassoCVWrapper(random_state=self.random_state) + if self.binary_outcome: + model_y = LogisticRegressionCV(cv=WeightedStratifiedKFold(random_state=self.random_state), + random_state=self.random_state) + else: + model_y = WeightedLassoCVWrapper(random_state=self.random_state) else: model_y = clone(self.model_y, safe=False) return _FirstStageWrapper(model_y, True, self._gen_featurizer(), - self.linear_first_stages, self.discrete_treatment) + self.linear_first_stages, self.discrete_treatment, 
self.binary_outcome) def _gen_model_t(self): if self.model_t == 'auto': @@ -542,7 +548,7 @@ def _gen_model_t(self): else: model_t = clone(self.model_t, safe=False) return _FirstStageWrapper(model_t, False, self._gen_featurizer(), - self.linear_first_stages, self.discrete_treatment) + self.linear_first_stages, self.discrete_treatment, self.binary_outcome) def _gen_model_final(self): return StatsModelsLinearRegression(fit_intercept=False) diff --git a/econml/tests/test_ortho_learner.py b/econml/tests/test_ortho_learner.py index 846d9facd..7927042d4 100644 --- a/econml/tests/test_ortho_learner.py +++ b/econml/tests/test_ortho_learner.py @@ -170,7 +170,7 @@ def _gen_ortho_learner_model_final(self): X = np.random.normal(size=(10000, 3)) sigma = 0.1 y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) - est = OrthoLearner(cv=2, discrete_treatment=False, treatment_featurizer=None, + est = OrthoLearner(cv=2, binary_outcome=False, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, categories='auto', random_state=None) est.fit(y, X[:, 0], W=X[:, 1:]) np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=3) @@ -187,8 +187,8 @@ def _gen_ortho_learner_model_final(self): X = np.random.normal(size=(10000, 3)) sigma = 0.1 y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) - est = OrthoLearner(cv=2, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, - categories='auto', random_state=None) + est = OrthoLearner(cv=2, binary_outcome=False, discrete_treatment=False, treatment_featurizer=None, + discrete_instrument=False, categories='auto', random_state=None) # test non-array inputs est.fit(list(y), list(X[:, 0]), X=None, W=X[:, 1:]) np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=3) @@ -268,8 +268,8 @@ def _gen_ortho_learner_model_final(self): X = np.random.normal(size=(10000, 3)) sigma = 0.1 y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) - 
est = OrthoLearner(cv=2, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, - categories='auto', random_state=None) + est = OrthoLearner(cv=2, binary_outcome=False, discrete_treatment=False, treatment_featurizer=None, + discrete_instrument=False, categories='auto', random_state=None) est.fit(y, X[:, 0], W=X[:, 1:]) np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=3) np.testing.assert_array_almost_equal(est.effect(), np.ones(1), decimal=3) @@ -318,8 +318,8 @@ def _gen_ortho_learner_model_final(self): X = np.random.normal(size=(10000, 3)) sigma = 0.1 y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) - est = OrthoLearner(cv=2, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, - categories='auto', random_state=None) + est = OrthoLearner(cv=2, binary_outcome=False, discrete_treatment=False, treatment_featurizer=None, + discrete_instrument=False, categories='auto', random_state=None) est.fit(y, X[:, 0], W=X[:, 1:]) np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=3) np.testing.assert_array_almost_equal(est.effect(), np.ones(1), decimal=3) @@ -380,8 +380,8 @@ def _gen_ortho_learner_model_final(self): T = np.random.binomial(1, scipy.special.expit(X[:, 0])) sigma = 0.01 y = T + X[:, 0] + np.random.normal(0, sigma, size=(10000,)) - est = OrthoLearner(cv=2, discrete_treatment=True, treatment_featurizer=None, discrete_instrument=False, - categories='auto', random_state=None) + est = OrthoLearner(cv=2, binary_outcome=False, discrete_treatment=True, treatment_featurizer=None, + discrete_instrument=False, categories='auto', random_state=None) est.fit(y, T, W=X) np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=3) np.testing.assert_array_almost_equal(est.effect(), np.ones(1), decimal=3) From 6bc066079f42c2bd56859f99d225b4224712e721 Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Mon, 25 Sep 2023 12:00:08 -0400 Subject: [PATCH 02/25] add init 
args to drlearner, causalforestdml Signed-off-by: Fabio Vera --- econml/dml/causal_forest.py | 4 +++- econml/dr/_drlearner.py | 8 ++++++++ 2 files changed, 11 insertions(+), 1 deletion(-) diff --git a/econml/dml/causal_forest.py b/econml/dml/causal_forest.py index 8faf157c2..bc30aa1d4 100644 --- a/econml/dml/causal_forest.py +++ b/econml/dml/causal_forest.py @@ -577,6 +577,7 @@ def __init__(self, *, model_t='auto', featurizer=None, treatment_featurizer=None, + binary_outcome=False, discrete_treatment=False, categories='auto', cv=2, @@ -630,7 +631,8 @@ def __init__(self, *, self.subforest_size = subforest_size self.n_jobs = n_jobs self.verbose = verbose - super().__init__(discrete_treatment=discrete_treatment, + super().__init__(binary_outcome=binary_outcome, + discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, categories=categories, cv=cv, diff --git a/econml/dr/_drlearner.py b/econml/dr/_drlearner.py index 3ca702a0c..e4e264113 100644 --- a/econml/dr/_drlearner.py +++ b/econml/dr/_drlearner.py @@ -402,6 +402,7 @@ def __init__(self, *, model_propensity='auto', model_regression='auto', model_final=StatsModelsLinearRegression(), + binary_outcome=False, multitask_model_final=False, featurizer=None, min_propensity=1e-6, @@ -419,6 +420,7 @@ def __init__(self, *, super().__init__(cv=cv, mc_iters=mc_iters, mc_agg=mc_agg, + binary_outcome=binary_outcome, discrete_treatment=True, treatment_featurizer=None, # treatment featurization not supported with discrete treatment discrete_instrument=False, # no instrument, so doesn't matter @@ -864,6 +866,7 @@ class LinearDRLearner(StatsModelsCateEstimatorDiscreteMixin, DRLearner): def __init__(self, *, model_propensity='auto', model_regression='auto', + binary_outcome=False, featurizer=None, fit_cate_intercept=True, min_propensity=1e-6, @@ -876,6 +879,7 @@ def __init__(self, *, super().__init__(model_propensity=model_propensity, model_regression=model_regression, model_final=None, + 
binary_outcome=binary_outcome, featurizer=featurizer, multitask_model_final=False, min_propensity=min_propensity, @@ -1137,6 +1141,7 @@ def __init__(self, *, model_regression='auto', featurizer=None, fit_cate_intercept=True, + binary_outcome=False, alpha='auto', n_alphas=100, alpha_cov='auto', @@ -1161,6 +1166,7 @@ def __init__(self, *, super().__init__(model_propensity=model_propensity, model_regression=model_regression, model_final=None, + binary_outcome=binary_outcome, featurizer=featurizer, multitask_model_final=False, min_propensity=min_propensity, @@ -1413,6 +1419,7 @@ class ForestDRLearner(ForestModelFinalCateEstimatorDiscreteMixin, DRLearner): def __init__(self, *, model_regression="auto", model_propensity="auto", + binary_outcome=False, featurizer=None, min_propensity=1e-6, categories='auto', @@ -1449,6 +1456,7 @@ def __init__(self, *, super().__init__(model_regression=model_regression, model_propensity=model_propensity, model_final=None, + binary_outcome=binary_outcome, featurizer=featurizer, multitask_model_final=False, min_propensity=min_propensity, From 058c3e8b26cf5bc6e05f76b5d402bac9645dcb18 Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Mon, 25 Sep 2023 12:14:57 -0400 Subject: [PATCH 03/25] modify bootstrap test to use np array Signed-off-by: Fabio Vera --- econml/tests/test_bootstrap.py | 14 +++++++------- 1 file changed, 7 insertions(+), 7 deletions(-) diff --git a/econml/tests/test_bootstrap.py b/econml/tests/test_bootstrap.py index df15f9cdb..3145ef07b 100644 --- a/econml/tests/test_bootstrap.py +++ b/econml/tests/test_bootstrap.py @@ -270,8 +270,8 @@ def test_internal_options(self): def test_stratify(self): """Test that we can properly stratify by treatment""" - T = [1, 0, 1, 2, 0, 2] - Y = [1, 2, 3, 4, 5, 6] + T = np.array([1, 0, 1, 2, 0, 2]) + Y = np.array([1, 2, 3, 4, 5, 6]) X = np.array([1, 1, 2, 2, 1, 2]).reshape(-1, 1) est = LinearDML(model_y=LinearRegression(), model_t=LogisticRegression(), discrete_treatment=True) inference = 
BootstrapInference(n_bootstrap_samples=5, n_jobs=-1, verbose=0) @@ -286,9 +286,9 @@ def test_stratify(self): def test_stratify_orthoiv(self): """Test that we can properly stratify by treatment/instrument pair""" - T = [1, 0, 1, 1, 0, 0, 1, 0] - Z = [1, 0, 0, 1, 0, 1, 0, 1] - Y = [1, 2, 3, 4, 5, 6, 7, 8] + T = np.array([1, 0, 1, 1, 0, 0, 1, 0]) + Z = np.array([1, 0, 0, 1, 0, 1, 0, 1]) + Y = np.array([1, 2, 3, 4, 5, 6, 7, 8]) X = np.array([1, 1, 2, 2, 1, 2, 1, 2]).reshape(-1, 1) est = LinearIntentToTreatDRIV(model_y_xw=LinearRegression(), model_t_xwz=LogisticRegression(), flexible_model_effect=LinearRegression(), cv=2) @@ -297,8 +297,8 @@ def test_stratify_orthoiv(self): est.const_marginal_effect_interval(X) def test_all_kinds(self): - T = [1, 0, 1, 2, 0, 2] * 5 - Y = [1, 2, 3, 4, 5, 6] * 5 + T = np.array([1, 0, 1, 2, 0, 2] * 5) + Y = np.array([1, 2, 3, 4, 5, 6] * 5) X = np.array([1, 1, 2, 2, 1, 2] * 5).reshape(-1, 1) est = LinearDML(cv=2) for kind in ['percentile', 'pivot', 'normal']: From a92d140cbd484b9a5d9a6bb247e45316fb93b05d Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Mon, 25 Sep 2023 15:47:26 -0400 Subject: [PATCH 04/25] bugfix causalforest firststagewrapper Signed-off-by: Fabio Vera --- econml/dml/causal_forest.py | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/econml/dml/causal_forest.py b/econml/dml/causal_forest.py index bc30aa1d4..1b91d0e03 100644 --- a/econml/dml/causal_forest.py +++ b/econml/dml/causal_forest.py @@ -658,7 +658,8 @@ def _gen_model_y(self): model_y = WeightedLassoCVWrapper(random_state=self.random_state) else: model_y = clone(self.model_y, safe=False) - return _FirstStageWrapper(model_y, True, self._gen_featurizer(), False, self.discrete_treatment) + return _FirstStageWrapper(model_y, True, self._gen_featurizer(), False, + self.discrete_treatment, self.binary_outcome) def _gen_model_t(self): if self.model_t == 'auto': @@ -669,7 +670,8 @@ def _gen_model_t(self): model_t = 
WeightedLassoCVWrapper(random_state=self.random_state) else: model_t = clone(self.model_t, safe=False) - return _FirstStageWrapper(model_t, False, self._gen_featurizer(), False, self.discrete_treatment) + return _FirstStageWrapper(model_t, False, self._gen_featurizer(), False, + self.discrete_treatment, self.binary_outcome) def _gen_model_final(self): return MultiOutputGRF(CausalForest(n_estimators=self.n_estimators, From 8929eab4c9162b40f390e3d955212329ca519f1b Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Mon, 25 Sep 2023 16:17:20 -0400 Subject: [PATCH 05/25] fix test bug ortholearner Signed-off-by: Fabio Vera --- econml/tests/test_ortho_learner.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/econml/tests/test_ortho_learner.py b/econml/tests/test_ortho_learner.py index 7927042d4..6db27cc37 100644 --- a/econml/tests/test_ortho_learner.py +++ b/econml/tests/test_ortho_learner.py @@ -203,7 +203,7 @@ def _gen_ortho_learner_model_final(self): X = np.random.normal(size=(10000, 3)) sigma = 0.1 y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) - est = OrthoLearner(cv=KFold(n_splits=3), + est = OrthoLearner(cv=KFold(n_splits=3), binary_outcome=False, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, categories='auto', random_state=None) est.fit(y, X[:, 0], X=None, W=X[:, 1:]) @@ -220,7 +220,7 @@ def _gen_ortho_learner_model_final(self): sigma = 0.1 y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) folds = [(np.arange(X.shape[0] // 2), np.arange(X.shape[0] // 2, X.shape[0]))] - est = OrthoLearner(cv=folds, discrete_treatment=False, treatment_featurizer=None, + est = OrthoLearner(cv=folds, binary_outcome=False, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, categories='auto', random_state=None) est.fit(y, X[:, 0], X=None, W=X[:, 1:]) np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=2) From 1540a081ca6987c525f38f7df3d61a1a3d6577b4 
Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Mon, 25 Sep 2023 17:08:22 -0400 Subject: [PATCH 06/25] fix test bugs treatfeat OL doctest Signed-off-by: Fabio Vera --- econml/_ortho_learner.py | 4 ++-- econml/tests/test_treatment_featurization.py | 1 + 2 files changed, 3 insertions(+), 2 deletions(-) diff --git a/econml/_ortho_learner.py b/econml/_ortho_learner.py index 498376f1d..84fde5f6e 100644 --- a/econml/_ortho_learner.py +++ b/econml/_ortho_learner.py @@ -342,7 +342,7 @@ def _gen_ortho_learner_model_final(self): np.random.seed(123) X = np.random.normal(size=(100, 3)) y = X[:, 0] + X[:, 1] + np.random.normal(0, 0.1, size=(100,)) - est = OrthoLearner(cv=2, discrete_treatment=False, treatment_featurizer=None, + est = OrthoLearner(cv=2, binary_outcome=False, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, categories='auto', random_state=None) est.fit(y, X[:, 0], W=X[:, 1:]) @@ -400,7 +400,7 @@ def _gen_ortho_learner_model_final(self): import scipy.special T = np.random.binomial(1, scipy.special.expit(W[:, 0])) y = T + W[:, 0] + np.random.normal(0, 0.01, size=(100,)) - est = OrthoLearner(cv=2, discrete_treatment=True, discrete_instrument=False, + est = OrthoLearner(cv=2, binary_outcome=False, discrete_treatment=True, discrete_instrument=False, treatment_featurizer=None, categories='auto', random_state=None) est.fit(y, T, W=W) diff --git a/econml/tests/test_treatment_featurization.py b/econml/tests/test_treatment_featurization.py index a58bf5754..4310ac413 100644 --- a/econml/tests/test_treatment_featurization.py +++ b/econml/tests/test_treatment_featurization.py @@ -504,6 +504,7 @@ def _gen_ortho_learner_model_final(self): 'estimator': OrthoLearner, 'params': { 'cv': 2, + 'binary_outcome': False, 'discrete_treatment': False, 'treatment_featurizer': None, 'discrete_instrument': False, From d39a0910696481107f9c27ebd02e52b2a648b18e Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Wed, 11 Oct 2023 11:05:23 -0400 Subject: [PATCH 07/25] 
add tests, allow str y, add warnings/errors Signed-off-by: Fabio Vera --- econml/_ortho_learner.py | 19 +++- econml/dml/dml.py | 13 ++- econml/dr/_drlearner.py | 24 +++-- econml/tests/test_binary_outcome.py | 161 ++++++++++++++++++++++++++++ 4 files changed, 206 insertions(+), 11 deletions(-) create mode 100644 econml/tests/test_binary_outcome.py diff --git a/econml/_ortho_learner.py b/econml/_ortho_learner.py index 84fde5f6e..3536c4925 100644 --- a/econml/_ortho_learner.py +++ b/econml/_ortho_learner.py @@ -639,6 +639,18 @@ def fit(self, Y, T, *, X=None, W=None, Z=None, sample_weight=None, freq_weight=N if not only_final: + if self.binary_outcome: + self.outcome_transformer = LabelEncoder() + self.outcome_transformer.fit(Y) + if Y.shape[1:] and Y.shape[1] > 1: + raise ValueError( + f"Only one outcome variable is supported when binary_outcome=True. Got Y of shape {Y.shape}") + if len(self.outcome_transformer.classes_) > 2: + raise AttributeError( + "More than 2 outcome classes detected. 
This method currently only supports binary outcomes") + else: + self.outcome_transformer = None + if self.discrete_treatment: categories = self.categories if categories != 'auto': @@ -781,7 +793,7 @@ def refit_final(self, inference=None): def _fit_nuisances(self, Y, T, X=None, W=None, Z=None, sample_weight=None, groups=None): # use a binary array to get stratified split in case of discrete treatment - stratify = self.discrete_treatment or self.discrete_instrument + stratify = self.discrete_treatment or self.discrete_instrument or self.binary_outcome strata = self._strata(Y, T, X=X, W=W, Z=Z, sample_weight=sample_weight, groups=groups) if strata is None: strata = T # always safe to pass T as second arg to split even if we're not actually stratifying @@ -794,6 +806,9 @@ def _fit_nuisances(self, Y, T, X=None, W=None, Z=None, sample_weight=None, group if self.discrete_instrument: Z = self.z_transformer.transform(reshape(Z, (-1, 1))) + if self.binary_outcome: + Y = self.outcome_transformer.transform(Y) + if self.cv == 1: # special case, no cross validation folds = None else: @@ -912,6 +927,8 @@ def score(self, Y, T, X=None, W=None, Z=None, sample_weight=None, groups=None): X, T = self._expand_treatments(X, T) if self.z_transformer is not None: Z = self.z_transformer.transform(reshape(Z, (-1, 1))) + if self.binary_outcome: + Y = self.outcome_transformer.transform(Y) n_iters = len(self._models_nuisance) n_splits = len(self._models_nuisance[0]) diff --git a/econml/dml/dml.py b/econml/dml/dml.py index 286702a16..f67b01164 100644 --- a/econml/dml/dml.py +++ b/econml/dml/dml.py @@ -88,10 +88,15 @@ def predict(self, X, W): if (not self._is_Y and self._discrete_treatment) or (self._is_Y and self._binary_outcome): return self._model.predict_proba(self._combine(X, W, n_samples, fitting=False))[:, 1:] else: - if (not self._is_Y) and (not self._discrete_treatment) and hasattr(self._model, 'predict_proba'): - warn("A treatment model has a predict_proba method, but 
discrete_treatment=False. " - "If your treatment is discrete, consider setting discrete_treatment=True. " - "Otherwise, if your treatment is not discrete, use a regressor instead.", UserWarning) + if hasattr(self._model, 'predict_proba'): + if (not self._is_Y): + warn("A treatment model has a predict_proba method, but discrete_treatment=False. " + "If your treatment is discrete, consider setting discrete_treatment=True. " + "Otherwise, if your treatment is not discrete, use a regressor instead.", UserWarning) + elif (self._is_Y): + warn("An outcome model has a predict_proba method, but binary_outcome=False. " + "If your outcome is binary, consider setting binary_outcome=True. " + "Otherwise, if your outcome is not binary, use a regressor instead.", UserWarning) return self._model.predict(self._combine(X, W, n_samples, fitting=False)) def score(self, X, W, Target, sample_weight=None): diff --git a/econml/dr/_drlearner.py b/econml/dr/_drlearner.py index e4e264113..d42a32f40 100644 --- a/econml/dr/_drlearner.py +++ b/econml/dr/_drlearner.py @@ -51,16 +51,18 @@ from ..grf import RegressionForest from ..sklearn_extensions.linear_model import ( DebiasedLasso, StatsModelsLinearRegression, WeightedLassoCVWrapper) +from ..sklearn_extensions.model_selection import WeightedStratifiedKFold from ..utilities import (_deprecate_positional, check_high_dimensional, filter_none_kwargs, fit_with_groups, inverse_onehot, get_feature_names_or_default) from .._shap import _shap_explain_multitask_model_cate, _shap_explain_model_cate class _ModelNuisance: - def __init__(self, model_propensity, model_regression, min_propensity): + def __init__(self, model_propensity, model_regression, min_propensity, binary_outcome): self._model_propensity = model_propensity self._model_regression = model_regression self._min_propensity = min_propensity + self._binary_outcome = binary_outcome def _combine(self, X, W): return np.hstack([arr for arr in [X, W] if arr is not None]) @@ -102,12 +104,18 @@ def 
predict(self, Y, T, X=None, W=None, *, sample_weight=None, groups=None): n = T.shape[0] Y_pred = np.zeros((T.shape[0], T.shape[1] + 1)) T_counter = np.zeros(T.shape) - Y_pred[:, 0] = self._model_regression.predict(np.hstack([XW, T_counter])).reshape(n) + if self._binary_outcome and hasattr(self._model_regression, 'predict_proba'): + Y_pred[:, 0] = self._model_regression.predict_proba(np.hstack([XW, T_counter]))[:, 1].reshape(n) + else: + Y_pred[:, 0] = self._model_regression.predict(np.hstack([XW, T_counter])).reshape(n) Y_pred[:, 0] += (Y.reshape(n) - Y_pred[:, 0]) * np.all(T == 0, axis=1) / propensities[:, 0] for t in np.arange(T.shape[1]): T_counter = np.zeros(T.shape) T_counter[:, t] = 1 - Y_pred[:, t + 1] = self._model_regression.predict(np.hstack([XW, T_counter])).reshape(n) + if self._binary_outcome and hasattr(self._model_regression, 'predict_proba'): + Y_pred[:, t + 1] = self._model_regression.predict_proba(np.hstack([XW, T_counter]))[:, 1].reshape(n) + else: + Y_pred[:, t + 1] = self._model_regression.predict(np.hstack([XW, T_counter])).reshape(n) Y_pred[:, t + 1] += (Y.reshape(n) - Y_pred[:, t + 1]) * (T[:, t] == 1) / propensities[:, t + 1] T_complete = np.hstack(((np.all(T == 0, axis=1) * 1).reshape(-1, 1), T)) propensities_weight = np.sum(propensities * T_complete, axis=1) @@ -486,11 +494,15 @@ def _gen_ortho_learner_model_nuisance(self): model_propensity = clone(self.model_propensity, safe=False) if self.model_regression == 'auto': - model_regression = WeightedLassoCVWrapper(cv=3, random_state=self.random_state) + if self.binary_outcome: + model_regression = LogisticRegressionCV(cv=WeightedStratifiedKFold(random_state=self.random_state), + random_state=self.random_state) + else: + model_regression = WeightedLassoCVWrapper(cv=3, random_state=self.random_state) else: - model_regression = clone(self.model_regression, safe=False) + model_regression = clone(self.model_y, safe=False) - return _ModelNuisance(model_propensity, model_regression, 
self.min_propensity) + return _ModelNuisance(model_propensity, model_regression, self.min_propensity, self.binary_outcome) def _gen_featurizer(self): return clone(self.featurizer, safe=False) diff --git a/econml/tests/test_binary_outcome.py b/econml/tests/test_binary_outcome.py new file mode 100644 index 000000000..8188e92d1 --- /dev/null +++ b/econml/tests/test_binary_outcome.py @@ -0,0 +1,161 @@ +# Copyright (c) PyWhy contributors. All rights reserved. +# Licensed under the MIT License. +import pytest +import unittest +import numpy as np +from sklearn.preprocessing import PolynomialFeatures +from sklearn.linear_model import LinearRegression, LogisticRegression +from sklearn.ensemble import RandomForestRegressor +from joblib import Parallel, delayed + +from econml._ortho_learner import _OrthoLearner +from econml.dml import LinearDML, SparseLinearDML, KernelDML, CausalForestDML, NonParamDML +from econml.dr import LinearDRLearner +from econml.iv.dml import OrthoIV, DMLIV, NonParamDMLIV +from econml.iv.dr import DRIV, LinearDRIV, SparseLinearDRIV, ForestDRIV +from econml.orf import DMLOrthoForest + +from econml.utilities import filter_none_kwargs +from copy import deepcopy + + +class TestBinaryOutcome(unittest.TestCase): + # accuracy test + def test_accuracy(): + n = 1000 + binary_outcome = True + discrete_treatment = True + true_ate = 0.3 + W = np.random.uniform(-1, 1, size=(n, 1)) + D = np.random.binomial(1, .5 + .1 * W[:, 0], size=(n,)) + Y = np.random.binomial(1, .5 + true_ate * D + .1 * W[:, 0], size=(n,)) + + ests = [ + LinearDML(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment), + CausalForestDML(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment), + LinearDRLearner(binary_outcome=binary_outcome) + ] + + for est in ests: + + if isinstance(est, CausalForestDML): + est.fit(Y, D, X=W) + ate = est.ate(X=W) + ate_lb, ate_ub = est.ate_interval(X=W) + + else: + est.fit(Y, D, W=W) + ate = est.ate() + ate_lb, ate_ub = 
est.ate_interval() + + if isinstance(est, LinearDRLearner): + est.summary(T=1) + else: + est.summary() + + proportion_in_interval = ((ate_lb < true_ate) & (true_ate < ate_ub)).mean() + np.testing.assert_array_less(0.50, proportion_in_interval) + + +# accuracy test, DML +def test_accuracy_iv(): + n = 10000 + binary_outcome = True + discrete_treatment = True + true_ate = 0.3 + W = np.random.uniform(-1, 1, size=(n, 1)) + Z = np.random.uniform(-1, 1, size=(n, 1)) + D = np.random.binomial(1, .5 + .1 * W[:, 0] + .1 * Z[:, 0], size=(n,)) + Y = np.random.binomial(1, .5 + true_ate * D + .1 * W[:, 0], size=(n,)) + + ests = [ + OrthoIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment), + LinearDRIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment), + ] + + for est in ests: + + est.fit(Y, D, W=W, Z=Z) + ate = est.ate() + ate_lb, ate_ub = est.ate_interval() + + est.summary() + + proportion_in_interval = ((ate_lb < true_ate) & (true_ate < ate_ub)).mean() + np.testing.assert_array_less(0.50, proportion_in_interval) + + +def test_string_outcome(): + n = 100 + true_ate = 0.3 + W = np.random.uniform(-1, 1, size=(n, 1)) + D = np.random.binomial(1, .5 + .1 * W[:, 0], size=(n,)) + Y = np.random.binomial(1, .5 + true_ate * D + .1 * W[:, 0], size=(n,)) + Y_str = pd.Series(Y).replace(0, 'a').replace(1, 'b').values + est = LinearDML(binary_outcome=True, discrete_treatment=True) + est.fit(Y_str, D, X=W) + + +def test_basic_functionality(): + n = 100 + binary_outcome = True + d_x = 3 + + def gen_array(n, is_binary, d): + sz = (n, d) if d > 0 else (n,) + + if is_binary: + return np.random.choice([0, 1], size=sz) + else: + return np.random.normal(size=sz) + + for discrete_treatment in [True, False]: + for discrete_instrument in [True, False, None]: + + Y = gen_array(n, binary_outcome, d=0) + T = gen_array(n, discrete_treatment, d=0) + Z = None + if discrete_instrument is not None: + Z = gen_array(n, discrete_instrument, d=0) + X = gen_array(n, 
is_binary=False, d=3) + + if Z is not None: + est_list = [ + DRIV(binary_outcome=binary_outcome), + DMLIV(binary_outcome=binary_outcome), + OrthoIV(binary_outcome=binary_outcome), + ] + + else: + est_list = [ + LinearDML(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment), + CausalForestDML(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment) + ] + + if discrete_treatment: + est_list += [ + LinearDRLearner(binary_outcome=binary_outcome), + ] + + for est in est_list: + print(est) + est.fit(Y, T, **filter_none_kwargs(X=X, Z=Z)) + est.score(Y, T, **filter_none_kwargs(X=X, Z=Z)) + est.effect(X=X) + est.const_marginal_effect(X=X) + est.marginal_effect(T, X=X) + est.ate(X=X) + + # make sure the auto outcome model is a classifier + if hasattr(est, 'model_y'): + outcome_model_attr = 'models_y' + elif hasattr(est, 'model_regression'): + outcome_model_attr = 'models_regression' + elif hasattr(est, 'model_y_xw'): + outcome_model_attr = 'models_y_xw' + assert ( + hasattr( + getattr(est, outcome_model_attr)[0][0], + 'predict_proba' + ) + ), 'Auto outcome model is not a classifier!' 
From ee64b0e4005bc7c867cec747f8f82e0ba27c08c3 Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Fri, 27 Oct 2023 11:41:03 -0400 Subject: [PATCH 08/25] bugfixes Signed-off-by: Fabio Vera --- econml/dr/_drlearner.py | 2 +- econml/tests/test_binary_outcome.py | 9 +++++---- econml/tests/test_missing_values.py | 5 +++-- 3 files changed, 9 insertions(+), 7 deletions(-) diff --git a/econml/dr/_drlearner.py b/econml/dr/_drlearner.py index d61f3e698..badb94a33 100644 --- a/econml/dr/_drlearner.py +++ b/econml/dr/_drlearner.py @@ -509,7 +509,7 @@ def _gen_ortho_learner_model_nuisance(self): else: model_regression = WeightedLassoCVWrapper(cv=3, random_state=self.random_state) else: - model_regression = clone(self.model_y, safe=False) + model_regression = clone(self.model_regression, safe=False) return _ModelNuisance(model_propensity, model_regression, self.min_propensity, self.binary_outcome) diff --git a/econml/tests/test_binary_outcome.py b/econml/tests/test_binary_outcome.py index 8188e92d1..a69b008e0 100644 --- a/econml/tests/test_binary_outcome.py +++ b/econml/tests/test_binary_outcome.py @@ -3,6 +3,7 @@ import pytest import unittest import numpy as np +import pandas as pd from sklearn.preprocessing import PolynomialFeatures from sklearn.linear_model import LinearRegression, LogisticRegression from sklearn.ensemble import RandomForestRegressor @@ -21,7 +22,7 @@ class TestBinaryOutcome(unittest.TestCase): # accuracy test - def test_accuracy(): + def test_accuracy(self): n = 1000 binary_outcome = True discrete_treatment = True @@ -58,7 +59,7 @@ def test_accuracy(): # accuracy test, DML -def test_accuracy_iv(): +def test_accuracy_iv(self): n = 10000 binary_outcome = True discrete_treatment = True @@ -85,7 +86,7 @@ def test_accuracy_iv(): np.testing.assert_array_less(0.50, proportion_in_interval) -def test_string_outcome(): +def test_string_outcome(self): n = 100 true_ate = 0.3 W = np.random.uniform(-1, 1, size=(n, 1)) @@ -96,7 +97,7 @@ def test_string_outcome(): 
est.fit(Y_str, D, X=W) -def test_basic_functionality(): +def test_basic_functionality(self): n = 100 binary_outcome = True d_x = 3 diff --git a/econml/tests/test_missing_values.py b/econml/tests/test_missing_values.py index 2ae355983..569a6d977 100644 --- a/econml/tests/test_missing_values.py +++ b/econml/tests/test_missing_values.py @@ -123,8 +123,9 @@ def test_missing(self): # model that can handle missing values nuisance_model = make_pipeline(SimpleImputer(strategy='mean'), LinearRegression()) - OrthoLearner(discrete_treatment=False, treatment_featurizer=None, discrete_instrument=None, - categories='auto', cv=3, random_state=1, allow_missing=True).fit(y, T, W=W_missing) + OrthoLearner(binary_outcome=False, discrete_treatment=False, treatment_featurizer=None, + discrete_instrument=None, categories='auto', cv=3, random_state=1, + allow_missing=True).fit(y, T, W=W_missing) CausalForestDML(model_y=nuisance_model, model_t=nuisance_model, allow_missing=True).fit(y, T, X=X, W=W_missing) From 5aaee9d43d9eac5e7342ef49d7d307008712fd6b Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Fri, 27 Oct 2023 11:56:26 -0400 Subject: [PATCH 09/25] linting Signed-off-by: Fabio Vera --- econml/iv/dr/_dr.py | 16 ++-------------- 1 file changed, 2 insertions(+), 14 deletions(-) diff --git a/econml/iv/dr/_dr.py b/econml/iv/dr/_dr.py index 76a6c419c..6d37f5764 100644 --- a/econml/iv/dr/_dr.py +++ b/econml/iv/dr/_dr.py @@ -679,21 +679,9 @@ def _gen_ortho_learner_model_nuisance(self): else: model_t_xwz = clone(self.model_t_xwz, safe=False) - return _BaseDRIVModelNuisance(self._gen_prel_model_effect(), - _FirstStageWrapper(model_y_xw, True, self._gen_featurizer(), - False, False, self.binary_outcome), - _FirstStageWrapper(model_t_xw, False, self._gen_featurizer(), - False, self.discrete_treatment, self.binary_outcome), - # target is continuous since proj_t is probability - _FirstStageWrapper(model_tz_xw, False, self._gen_featurizer(), False, - False, self.binary_outcome), - 
_FirstStageWrapper(model_t_xwz, False, self._gen_featurizer(), - False, self.discrete_treatment, self.binary_outcome), - self.projection, self.discrete_treatment, self.discrete_instrument) - return _BaseDRIVModelNuisance(prel_model_effect=self._gen_prel_model_effect(), model_y_xw=_FirstStageWrapper( - model_y_xw, True, self._gen_featurizer(), + model_y_xw, True, self._gen_featurizer(), False, False, self.binary_outcome), model_t_xw=_FirstStageWrapper(model_t_xw, False, self._gen_featurizer(), False, self.discrete_treatment, @@ -730,7 +718,7 @@ def _gen_ortho_learner_model_nuisance(self): return _BaseDRIVModelNuisance(prel_model_effect=self._gen_prel_model_effect(), model_y_xw=_FirstStageWrapper( - model_y_xw, True, self._gen_featurizer(), + model_y_xw, True, self._gen_featurizer(), False, False, self.binary_outcome), model_t_xw=_FirstStageWrapper(model_t_xw, False, self._gen_featurizer(), False, self.discrete_treatment, From 9064f8ba411f5278456cc5f5c475a4e7182c8ec6 Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Fri, 27 Oct 2023 12:56:00 -0400 Subject: [PATCH 10/25] indent Signed-off-by: Fabio Vera --- econml/tests/test_binary_outcome.py | 196 ++++++++++++++-------------- 1 file changed, 98 insertions(+), 98 deletions(-) diff --git a/econml/tests/test_binary_outcome.py b/econml/tests/test_binary_outcome.py index a69b008e0..d68eb0b30 100644 --- a/econml/tests/test_binary_outcome.py +++ b/econml/tests/test_binary_outcome.py @@ -58,105 +58,105 @@ def test_accuracy(self): np.testing.assert_array_less(0.50, proportion_in_interval) -# accuracy test, DML -def test_accuracy_iv(self): - n = 10000 - binary_outcome = True - discrete_treatment = True - true_ate = 0.3 - W = np.random.uniform(-1, 1, size=(n, 1)) - Z = np.random.uniform(-1, 1, size=(n, 1)) - D = np.random.binomial(1, .5 + .1 * W[:, 0] + .1 * Z[:, 0], size=(n,)) - Y = np.random.binomial(1, .5 + true_ate * D + .1 * W[:, 0], size=(n,)) - - ests = [ - OrthoIV(binary_outcome=binary_outcome, 
discrete_treatment=discrete_treatment), - LinearDRIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment), - ] - - for est in ests: - - est.fit(Y, D, W=W, Z=Z) - ate = est.ate() - ate_lb, ate_ub = est.ate_interval() - - est.summary() - - proportion_in_interval = ((ate_lb < true_ate) & (true_ate < ate_ub)).mean() - np.testing.assert_array_less(0.50, proportion_in_interval) - - -def test_string_outcome(self): - n = 100 - true_ate = 0.3 - W = np.random.uniform(-1, 1, size=(n, 1)) - D = np.random.binomial(1, .5 + .1 * W[:, 0], size=(n,)) - Y = np.random.binomial(1, .5 + true_ate * D + .1 * W[:, 0], size=(n,)) - Y_str = pd.Series(Y).replace(0, 'a').replace(1, 'b').values - est = LinearDML(binary_outcome=True, discrete_treatment=True) - est.fit(Y_str, D, X=W) - - -def test_basic_functionality(self): - n = 100 - binary_outcome = True - d_x = 3 - - def gen_array(n, is_binary, d): - sz = (n, d) if d > 0 else (n,) - - if is_binary: - return np.random.choice([0, 1], size=sz) - else: - return np.random.normal(size=sz) - - for discrete_treatment in [True, False]: - for discrete_instrument in [True, False, None]: - - Y = gen_array(n, binary_outcome, d=0) - T = gen_array(n, discrete_treatment, d=0) - Z = None - if discrete_instrument is not None: - Z = gen_array(n, discrete_instrument, d=0) - X = gen_array(n, is_binary=False, d=3) - - if Z is not None: - est_list = [ - DRIV(binary_outcome=binary_outcome), - DMLIV(binary_outcome=binary_outcome), - OrthoIV(binary_outcome=binary_outcome), - ] + # accuracy test, DML + def test_accuracy_iv(self): + n = 10000 + binary_outcome = True + discrete_treatment = True + true_ate = 0.3 + W = np.random.uniform(-1, 1, size=(n, 1)) + Z = np.random.uniform(-1, 1, size=(n, 1)) + D = np.random.binomial(1, .5 + .1 * W[:, 0] + .1 * Z[:, 0], size=(n,)) + Y = np.random.binomial(1, .5 + true_ate * D + .1 * W[:, 0], size=(n,)) + + ests = [ + OrthoIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment), + 
LinearDRIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment), + ] + + for est in ests: + + est.fit(Y, D, W=W, Z=Z) + ate = est.ate() + ate_lb, ate_ub = est.ate_interval() + est.summary() + + proportion_in_interval = ((ate_lb < true_ate) & (true_ate < ate_ub)).mean() + np.testing.assert_array_less(0.50, proportion_in_interval) + + + def test_string_outcome(self): + n = 100 + true_ate = 0.3 + W = np.random.uniform(-1, 1, size=(n, 1)) + D = np.random.binomial(1, .5 + .1 * W[:, 0], size=(n,)) + Y = np.random.binomial(1, .5 + true_ate * D + .1 * W[:, 0], size=(n,)) + Y_str = pd.Series(Y).replace(0, 'a').replace(1, 'b').values + est = LinearDML(binary_outcome=True, discrete_treatment=True) + est.fit(Y_str, D, X=W) + + + def test_basic_functionality(self): + n = 100 + binary_outcome = True + d_x = 3 + + def gen_array(n, is_binary, d): + sz = (n, d) if d > 0 else (n,) + + if is_binary: + return np.random.choice([0, 1], size=sz) else: - est_list = [ - LinearDML(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment), - CausalForestDML(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment) - ] - - if discrete_treatment: - est_list += [ - LinearDRLearner(binary_outcome=binary_outcome), + return np.random.normal(size=sz) + + for discrete_treatment in [True, False]: + for discrete_instrument in [True, False, None]: + + Y = gen_array(n, binary_outcome, d=0) + T = gen_array(n, discrete_treatment, d=0) + Z = None + if discrete_instrument is not None: + Z = gen_array(n, discrete_instrument, d=0) + X = gen_array(n, is_binary=False, d=3) + + if Z is not None: + est_list = [ + DRIV(binary_outcome=binary_outcome), + DMLIV(binary_outcome=binary_outcome), + OrthoIV(binary_outcome=binary_outcome), + ] + + else: + est_list = [ + LinearDML(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment), + CausalForestDML(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment) ] - for est in est_list: - print(est) - 
est.fit(Y, T, **filter_none_kwargs(X=X, Z=Z)) - est.score(Y, T, **filter_none_kwargs(X=X, Z=Z)) - est.effect(X=X) - est.const_marginal_effect(X=X) - est.marginal_effect(T, X=X) - est.ate(X=X) - - # make sure the auto outcome model is a classifier - if hasattr(est, 'model_y'): - outcome_model_attr = 'models_y' - elif hasattr(est, 'model_regression'): - outcome_model_attr = 'models_regression' - elif hasattr(est, 'model_y_xw'): - outcome_model_attr = 'models_y_xw' - assert ( - hasattr( - getattr(est, outcome_model_attr)[0][0], - 'predict_proba' - ) - ), 'Auto outcome model is not a classifier!' + if discrete_treatment: + est_list += [ + LinearDRLearner(binary_outcome=binary_outcome), + ] + + for est in est_list: + print(est) + est.fit(Y, T, **filter_none_kwargs(X=X, Z=Z)) + est.score(Y, T, **filter_none_kwargs(X=X, Z=Z)) + est.effect(X=X) + est.const_marginal_effect(X=X) + est.marginal_effect(T, X=X) + est.ate(X=X) + + # make sure the auto outcome model is a classifier + if hasattr(est, 'model_y'): + outcome_model_attr = 'models_y' + elif hasattr(est, 'model_regression'): + outcome_model_attr = 'models_regression' + elif hasattr(est, 'model_y_xw'): + outcome_model_attr = 'models_y_xw' + assert ( + hasattr( + getattr(est, outcome_model_attr)[0][0], + 'predict_proba' + ) + ), 'Auto outcome model is not a classifier!' 
From c98edbc4f56fa6b1b0f018bcd5f0dd23e03c04fb Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Fri, 27 Oct 2023 12:56:40 -0400 Subject: [PATCH 11/25] linting Signed-off-by: Fabio Vera --- econml/tests/test_binary_outcome.py | 3 --- 1 file changed, 3 deletions(-) diff --git a/econml/tests/test_binary_outcome.py b/econml/tests/test_binary_outcome.py index d68eb0b30..ccf42bd24 100644 --- a/econml/tests/test_binary_outcome.py +++ b/econml/tests/test_binary_outcome.py @@ -57,7 +57,6 @@ def test_accuracy(self): proportion_in_interval = ((ate_lb < true_ate) & (true_ate < ate_ub)).mean() np.testing.assert_array_less(0.50, proportion_in_interval) - # accuracy test, DML def test_accuracy_iv(self): n = 10000 @@ -85,7 +84,6 @@ def test_accuracy_iv(self): proportion_in_interval = ((ate_lb < true_ate) & (true_ate < ate_ub)).mean() np.testing.assert_array_less(0.50, proportion_in_interval) - def test_string_outcome(self): n = 100 true_ate = 0.3 @@ -96,7 +94,6 @@ def test_string_outcome(self): est = LinearDML(binary_outcome=True, discrete_treatment=True) est.fit(Y_str, D, X=W) - def test_basic_functionality(self): n = 100 binary_outcome = True From 1ff950527ba19d7dd1f763d986678226e2ad3a9b Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Thu, 9 Nov 2023 13:46:30 -0500 Subject: [PATCH 12/25] rlearner doctest Signed-off-by: Fabio Vera --- econml/dml/_rlearner.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/econml/dml/_rlearner.py b/econml/dml/_rlearner.py index 02b6ec879..48a703a25 100644 --- a/econml/dml/_rlearner.py +++ b/econml/dml/_rlearner.py @@ -227,7 +227,7 @@ def _gen_rlearner_model_final(self): np.random.seed(123) X = np.random.normal(size=(1000, 3)) y = X[:, 0] + X[:, 1] + np.random.normal(0, 0.01, size=(1000,)) - est = RLearner(cv=2, discrete_treatment=False, + est = RLearner(cv=2, binary_outcome=False, discrete_treatment=False, treatment_featurizer=None, categories='auto', random_state=None) est.fit(y, X[:, 0], X=np.ones((X.shape[0], 1)), W=X[:, 1:]) 
From a67eb544d1698cccff444d886a7355ae53024080 Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Thu, 7 Dec 2023 14:09:42 -0500 Subject: [PATCH 13/25] linting Signed-off-by: Fabio Vera --- econml/dml/_rlearner.py | 27 +++++++++++++-------------- econml/iv/dml/_dml.py | 3 --- econml/iv/dr/_dr.py | 4 +++- econml/panel/dml/_dml.py | 4 +++- 4 files changed, 19 insertions(+), 19 deletions(-) diff --git a/econml/dml/_rlearner.py b/econml/dml/_rlearner.py index 889409bb6..27932fd2c 100644 --- a/econml/dml/_rlearner.py +++ b/econml/dml/_rlearner.py @@ -290,20 +290,19 @@ def _gen_rlearner_model_final(self): is multidimensional, then the average of the MSEs for each dimension of Y is returned. """ - def __init__( - self, - *, - binary_outcome, - discrete_treatment, - treatment_featurizer, - categories, - cv, - random_state, - mc_iters=None, - mc_agg='mean', - allow_missing=False, - use_ray=False, - ray_remote_func_options=None): + def __init__(self, + *, + binary_outcome, + discrete_treatment, + treatment_featurizer, + categories, + cv, + random_state, + mc_iters=None, + mc_agg='mean', + allow_missing=False, + use_ray=False, + ray_remote_func_options=None): super().__init__(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, diff --git a/econml/iv/dml/_dml.py b/econml/iv/dml/_dml.py index 9856b65d1..21d581edb 100644 --- a/econml/iv/dml/_dml.py +++ b/econml/iv/dml/_dml.py @@ -417,7 +417,6 @@ def _gen_ortho_learner_model_nuisance(self): is_discrete=self.discrete_instrument, random_state=self.random_state) - return _OrthoIVNuisanceSelector(model_y, model_t, model_z, self.projection) @@ -1170,8 +1169,6 @@ def _gen_model_t_xw(self): def _gen_model_t_xwz(self): return _make_first_stage_selector(self.model_t_xwz, self.discrete_treatment, self.random_state) - > main - def _gen_model_final(self): return clone(self.model_final, safe=False) diff --git a/econml/iv/dr/_dr.py b/econml/iv/dr/_dr.py index f04b5ffe7..458cd7ef6 100644 
--- a/econml/iv/dr/_dr.py +++ b/econml/iv/dr/_dr.py @@ -2464,7 +2464,9 @@ def _gen_prel_model_effect(self): return clone(self.prel_model_effect, safe=False) def _gen_ortho_learner_model_nuisance(self): - model_y_xw = _make_first_stage_selector(self.model_y_xw, is_discrete=self.binary_outcome, random_state=self.random_state) + model_y_xw = _make_first_stage_selector(self.model_y_xw, + is_discrete=self.binary_outcome, + random_state=self.random_state) model_t_xwz = _make_first_stage_selector(self.model_t_xwz, is_discrete=True, random_state=self.random_state) if self.z_propensity == "auto": diff --git a/econml/panel/dml/_dml.py b/econml/panel/dml/_dml.py index 366475256..8235e6422 100644 --- a/econml/panel/dml/_dml.py +++ b/econml/panel/dml/_dml.py @@ -542,7 +542,9 @@ def _gen_featurizer(self): return clone(self.featurizer, safe=False) def _gen_model_y(self): - return _make_first_stage_selector(self.model_y, is_discrete=self.binary_outcome, random_state=self.random_state) + return _make_first_stage_selector(self.model_y, + is_discrete=self.binary_outcome, + random_state=self.random_state) def _gen_model_t(self): return _make_first_stage_selector(self.model_t, From e104d73110807d89f35b2067d408626aa7f595b1 Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Thu, 7 Dec 2023 14:21:54 -0500 Subject: [PATCH 14/25] more typos Signed-off-by: Fabio Vera --- econml/dml/dml.py | 1 - econml/iv/dr/_dr.py | 4 ++-- 2 files changed, 2 insertions(+), 3 deletions(-) diff --git a/econml/dml/dml.py b/econml/dml/dml.py index cdeacaf87..148d55451 100644 --- a/econml/dml/dml.py +++ b/econml/dml/dml.py @@ -722,7 +722,6 @@ def __init__(self, *, featurizer=None, treatment_featurizer=None, fit_cate_intercept=True, - linear_first_stages="deprecated, binary_outcome=False, linear_first_stages="deprecated", discrete_treatment=False, diff --git a/econml/iv/dr/_dr.py b/econml/iv/dr/_dr.py index 458cd7ef6..589f914e0 100644 --- a/econml/iv/dr/_dr.py +++ b/econml/iv/dr/_dr.py @@ -2464,7 +2464,7 @@ def 
_gen_prel_model_effect(self): return clone(self.prel_model_effect, safe=False) def _gen_ortho_learner_model_nuisance(self): - model_y_xw = _make_first_stage_selector(self.model_y_xw, + model_y_xw = _make_first_stage_selector(self.model_y_xw, is_discrete=self.binary_outcome, random_state=self.random_state) model_t_xwz = _make_first_stage_selector(self.model_t_xwz, is_discrete=True, random_state=self.random_state) @@ -2479,7 +2479,7 @@ def _gen_ortho_learner_model_nuisance(self): dummy_z = _make_first_stage_selector(dummy_z, is_discrete=True, random_state=self.random_state) return _IntentToTreatDRIVNuisanceSelector(model_y_xw, model_t_xwz, dummy_z, self._gen_prel_model_effect()) - + class _DummyCATE: """ From edc0b485a64f48654b551c05fa7fd3a28c8fe545 Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Fri, 15 Dec 2023 15:14:05 -0500 Subject: [PATCH 15/25] bugfixes, docstrings, enable for intenttotreatdrivs Signed-off-by: Fabio Vera --- econml/_ortho_learner.py | 7 +- econml/dml/_rlearner.py | 3 + econml/dml/causal_forest.py | 43 ++- econml/dml/dml.py | 219 ++++++++---- econml/dr/_drlearner.py | 152 +++++++-- econml/dynamic/dml/__init__.py | 40 ++- econml/iv/dml/_dml.py | 216 ++++++++---- econml/iv/dr/_dr.py | 512 ++++++++++++++++++++-------- econml/panel/dml/_dml.py | 43 ++- econml/policy/_drlearner.py | 68 +++- econml/tests/test_binary_outcome.py | 32 +- 11 files changed, 983 insertions(+), 352 deletions(-) diff --git a/econml/_ortho_learner.py b/econml/_ortho_learner.py index 84fdf3870..3b0d34e98 100644 --- a/econml/_ortho_learner.py +++ b/econml/_ortho_learner.py @@ -327,6 +327,9 @@ class _OrthoLearner(TreatmentExpansionMixin, LinearCateEstimator): Parameters ---------- + binary_outcome: bool + Whether the outcome should be treated as binary + discrete_treatment: bool Whether the treatment values should be treated as categorical, rather than continuous, quantities @@ -921,7 +924,7 @@ def _fit_nuisances(self, Y, T, X=None, W=None, Z=None, sample_weight=None, group Z = 
self.z_transformer.transform(reshape(Z, (-1, 1))) if self.binary_outcome: - Y = self.outcome_transformer.transform(Y) + Y = self.outcome_transformer.transform(Y).reshape(Y.shape) if self.cv == 1: # special case, no cross validation folds = None @@ -1054,7 +1057,7 @@ def score(self, Y, T, X=None, W=None, Z=None, sample_weight=None, groups=None): if self.z_transformer is not None: Z = self.z_transformer.transform(reshape(Z, (-1, 1))) if self.binary_outcome: - Y = self.outcome_transformer.transform(Y) + Y = self.outcome_transformer.transform(Y).reshape(Y.shape) n_iters = len(self._models_nuisance) n_splits = len(self._models_nuisance[0]) diff --git a/econml/dml/_rlearner.py b/econml/dml/_rlearner.py index 27932fd2c..2120c6e17 100644 --- a/econml/dml/_rlearner.py +++ b/econml/dml/_rlearner.py @@ -137,6 +137,9 @@ class _RLearner(_OrthoLearner): Parameters ---------- + binary_outcome: bool + Whether the outcome should be treated as binary + discrete_treatment: bool Whether the treatment values should be treated as categorical, rather than continuous, quantities diff --git a/econml/dml/causal_forest.py b/econml/dml/causal_forest.py index 4e525561e..6b8ea1bd2 100644 --- a/econml/dml/causal_forest.py +++ b/econml/dml/causal_forest.py @@ -268,17 +268,35 @@ class CausalForestDML(_BaseDML): Parameters ---------- - model_y: estimator or 'auto', default 'auto' - The estimator for fitting the response to the features. Must implement - `fit` and `predict` methods. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. - - model_t: estimator or 'auto', default 'auto' - The estimator for fitting the treatment to the features. - If estimator, it must implement `fit` and `predict` methods; - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. 
+ model_y: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + Determines how to fit the outcome to the features. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. + + model_t: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + Determines how to fit the treatment to the features. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. featurizer : :term:`transformer`, optional Must support fit_transform and transform. Used to create composite features in the final CATE regression. @@ -290,6 +308,9 @@ class CausalForestDML(_BaseDML): The final CATE will be trained on the outcome of featurizer.fit_transform(T). If featurizer=None, then CATE is trained on T. 
+ binary_outcome: bool, default ``False`` + Whether the outcome should be treated as binary + discrete_treatment: bool, default ``False`` Whether the treatment values should be treated as categorical, rather than continuous, quantities diff --git a/econml/dml/dml.py b/econml/dml/dml.py index 148d55451..c4fa78038 100644 --- a/econml/dml/dml.py +++ b/econml/dml/dml.py @@ -348,20 +348,35 @@ class takes as input the parameter `model_t`, which is an arbitrary scikit-learn Parameters ---------- - model_y: estimator or 'auto', default 'auto' - The estimator for fitting the response to the features. Must implement - `fit` and `predict` methods. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. - - model_t: estimator or 'auto' (default is 'auto') - The estimator for fitting the treatment to the features. - If estimator, it must implement `fit` and `predict` methods. Must be a linear model for correctness - when linear_first_stages is ``True``; - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/ - :class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. + model_y: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + Determines how to fit the outcome to the features. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. 
+ + model_t: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + Determines how to fit the treatment to the features. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. model_final: estimator The estimator for fitting the response residuals to the treatment residuals. Must implement @@ -384,7 +399,10 @@ class takes as input the parameter `model_t`, which is an arbitrary scikit-learn Whether the first stage models are linear (in which case we will expand the features passed to `model_y` accordingly) - discrete_treatment: bool, default False + binary_outcome: bool, default ``False`` + Whether the outcome should be treated as binary + + discrete_treatment: bool, default ``False`` Whether the treatment values should be treated as categorical, rather than continuous, quantities categories: 'auto' or list, default 'auto' @@ -483,7 +501,9 @@ class takes as input the parameter `model_t`, which is an arbitrary scikit-learn """ def __init__(self, *, - model_y, model_t, model_final, + model_y, + model_t, + model_final, featurizer=None, treatment_featurizer=None, fit_cate_intercept=True, @@ -602,17 +622,35 @@ class LinearDML(StatsModelsCateEstimatorMixin, DML): Parameters ---------- - model_y: estimator or 'auto', default 'auto' - The estimator for fitting the response to the features. Must implement - `fit` and `predict` methods. 
- If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. - - model_t: estimator or 'auto', default 'auto' - The estimator for fitting the treatment to the features. - If estimator, it must implement `fit` and `predict` methods; - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. + model_y: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + Determines how to fit the outcome to the features. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. + + model_t: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + Determines how to fit the treatment to the features. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. 
+ - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. featurizer : :term:`transformer`, optional Must support fit_transform and transform. Used to create composite features in the final CATE regression. @@ -631,6 +669,9 @@ class LinearDML(StatsModelsCateEstimatorMixin, DML): Whether the first stage models are linear (in which case we will expand the features passed to `model_y` accordingly) + binary_outcome: bool, default ``False`` + Whether the outcome should be treated as binary + discrete_treatment: bool, default ``False`` Whether the treatment values should be treated as categorical, rather than continuous, quantities @@ -722,8 +763,8 @@ def __init__(self, *, featurizer=None, treatment_featurizer=None, fit_cate_intercept=True, - binary_outcome=False, linear_first_stages="deprecated", + binary_outcome=False, discrete_treatment=False, categories='auto', cv=2, @@ -826,20 +867,35 @@ class SparseLinearDML(DebiasedLassoCateEstimatorMixin, DML): Parameters ---------- - model_y: estimator or 'auto', default 'auto' - The estimator for fitting the response to the features. Must implement - `fit` and `predict` methods. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. - - model_t: estimator or 'auto', default 'auto' - The estimator for fitting the treatment to the features. - If estimator, it must implement `fit` and `predict` methods, and must be a - linear model for correctness; - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/ - :class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. + model_y: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + Determines how to fit the outcome to the features. 
+ + - If an estimator, will use the model as is for fitting. 
+ - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. + + model_t: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + Determines how to fit the treatment to the features. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. alpha: str or float, default 'auto' CATE L1 regularization applied through the debiased lasso in the final model. 
@@ -888,6 +944,9 @@ class SparseLinearDML(DebiasedLassoCateEstimatorMixin, DML): Whether the first stage models are linear (in which case we will expand the features passed to `model_y` accordingly) + binary_outcome: bool, default ``False`` + Whether the outcome should be treated as binary + discrete_treatment: bool, default ``False`` Whether the treatment values should be treated as categorical, rather than continuous, quantities @@ -1111,19 +1170,32 @@ class KernelDML(DML): Parameters ---------- - model_y: estimator or 'auto', default 'auto' - The estimator for fitting the response to the features. Must implement - `fit` and `predict` methods. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. - - model_t: estimator or 'auto', default 'auto' - The estimator for fitting the treatment to the features. - If estimator, it must implement `fit` and `predict` methods; - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/ - :class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. + model_y: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + Determines how to fit the outcome to the features. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. 
+ + model_t: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + Determines how to fit the treatment to the features. + + - If an estimator, will use the model as is for fitting. + + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. fit_cate_intercept : bool, default True Whether the linear CATE model should have a constant term. @@ -1134,6 +1206,9 @@ class KernelDML(DML): bw: float, default 1.0 The bandwidth of the Gaussian used to generate features + binary_outcome: bool, default ``False`` + Whether the outcome should be treated as binary + discrete_treatment: bool, default ``False`` Whether the treatment values should be treated as categorical, rather than continuous, quantities @@ -1320,13 +1395,32 @@ class NonParamDML(_BaseDML): Parameters ---------- - model_y: estimator - The estimator for fitting the response to the features. Must implement - `fit` and `predict` methods. Must be a linear model for correctness when linear_first_stages is ``True``. + model_y: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + Determines how to fit the outcome to the features. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. 
+ - If 'auto', model will select over linear and forest models - model_t: estimator - The estimator for fitting the treatment to the features. Must implement - `fit` and `predict` methods. Must be a linear model for correctness when linear_first_stages is ``True``. + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. + + model_t: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + Determines how to fit the treatment to the features. + + - If an estimator, will use the model as is for fitting. + + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. model_final: estimator The estimator for fitting the response residuals to the treatment residuals. Must implement @@ -1337,6 +1431,9 @@ class NonParamDML(_BaseDML): The transformer used to featurize the raw features when fitting the final model. Must implement a `fit_transform` method. + binary_outcome: bool, default ``False`` + Whether the outcome should be treated as binary + discrete_treatment: bool, default ``False`` Whether the treatment values should be treated as categorical, rather than continuous, quantities diff --git a/econml/dr/_drlearner.py b/econml/dr/_drlearner.py index 59883cbcd..c03f8b7ac 100644 --- a/econml/dr/_drlearner.py +++ b/econml/dr/_drlearner.py @@ -241,18 +241,35 @@ class takes as input the parameter ``model_regressor``, which is an arbitrary sc Parameters ---------- - model_propensity : scikit-learn classifier or 'auto', default 'auto' + model_propensity : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' Estimator for Pr[T=t | X, W]. 
Trained by regressing treatments on (features, controls) concatenated. - Must implement `fit` and `predict_proba` methods. The `fit` method must be able to accept X and T, - where T is a shape (n, ) array. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` will be chosen. - model_regression : scikit-learn regressor or 'auto', default 'auto' + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV + - 'forest' - RandomForestClassifier + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict', and 'predict_proba'. + + model_regression : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' Estimator for E[Y | X, W, T]. Trained by regressing Y on (features, controls, one-hot-encoded treatments) - concatenated. The one-hot-encoding excludes the baseline treatment. Must implement `fit` and - `predict` methods. If different models per treatment arm are desired, see the - :class:`.MultiModelWrapper` helper class. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. + concatenated. The one-hot-encoding excludes the baseline treatment. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. 
+ - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. model_final : estimator for the final cate model. Trained on regressing the doubly robust potential outcomes @@ -268,6 +285,9 @@ class takes as input the parameter ``model_regressor``, which is an arbitrary sc mono-task model and a separate clone of the model is trained for each outcome. Then predict(X) of the t-th clone will be the CATE of the t-th lexicographically ordered treatment compared to the baseline. + binary_outcome: bool, default False + Whether the outcome should be treated as binary + multitask_model_final : bool, default False Whether the model_final should be treated as a multi-task model. See description of model_final. @@ -783,18 +803,35 @@ class LinearDRLearner(StatsModelsCateEstimatorDiscreteMixin, DRLearner): Parameters ---------- - model_propensity : scikit-learn classifier or 'auto', default 'auto' + model_propensity : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' Estimator for Pr[T=t | X, W]. Trained by regressing treatments on (features, controls) concatenated. - Must implement `fit` and `predict_proba` methods. The `fit` method must be able to accept X and T, - where T is a shape (n, ) array. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` will be chosen. - model_regression : scikit-learn regressor or 'auto', default 'auto' + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV + - 'forest' - RandomForestClassifier + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. 
+ - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict', and 'predict_proba'. + + model_regression : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' Estimator for E[Y | X, W, T]. Trained by regressing Y on (features, controls, one-hot-encoded treatments) - concatenated. The one-hot-encoding excludes the baseline treatment. Must implement `fit` and - `predict` methods. If different models per treatment arm are desired, see the - :class:`.MultiModelWrapper` helper class. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. + concatenated. The one-hot-encoding excludes the baseline treatment. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. featurizer : :term:`transformer`, optional Must support fit_transform and transform. Used to create composite features in the final CATE regression. @@ -804,6 +841,9 @@ class LinearDRLearner(StatsModelsCateEstimatorDiscreteMixin, DRLearner): fit_cate_intercept : bool, default True Whether the linear CATE model should have a constant term. + binary_outcome: bool, default False + Whether the outcome should be treated as binary + min_propensity : float, default ``1e-6`` The minimum propensity at which to clip propensity estimates to avoid dividing by zero. 
@@ -903,9 +943,9 @@ class LinearDRLearner(StatsModelsCateEstimatorDiscreteMixin, DRLearner): def __init__(self, *, model_propensity='auto', model_regression='auto', - binary_outcome=False, featurizer=None, fit_cate_intercept=True, + binary_outcome=False, min_propensity=1e-6, categories='auto', cv=2, @@ -1048,18 +1088,35 @@ class SparseLinearDRLearner(DebiasedLassoCateEstimatorDiscreteMixin, DRLearner): Parameters ---------- - model_propensity : scikit-learn classifier or 'auto', default 'auto' + model_propensity : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' Estimator for Pr[T=t | X, W]. Trained by regressing treatments on (features, controls) concatenated. - Must implement `fit` and `predict_proba` methods. The `fit` method must be able to accept X and T, - where T is a shape (n, ) array. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` will be chosen. - model_regression : scikit-learn regressor or 'auto', default 'auto' + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV + - 'forest' - RandomForestClassifier + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit', 'predict', and 'predict_proba' methods. + + model_regression : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' Estimator for E[Y | X, W, T]. Trained by regressing Y on (features, controls, one-hot-encoded treatments) - concatenated. The one-hot-encoding excludes the baseline treatment. Must implement `fit` and - `predict` methods. If different models per treatment arm are desired, see the - :class:`.MultiModelWrapper` helper class. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen.
+ concatenated. The one-hot-encoding excludes the baseline treatment. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. featurizer : :term:`transformer`, optional Must support fit_transform and transform. Used to create composite features in the final CATE regression. @@ -1069,6 +1126,9 @@ class SparseLinearDRLearner(DebiasedLassoCateEstimatorDiscreteMixin, DRLearner): fit_cate_intercept : bool, default True Whether the linear CATE model should have a constant term. + binary_outcome: bool, default False + Whether the outcome should be treated as binary + alpha: str | float, optional., default 'auto'. CATE L1 regularization applied through the debiased lasso in the final model. 'auto' corresponds to a CV form of the :class:`DebiasedLasso`. @@ -1330,16 +1390,38 @@ class ForestDRLearner(ForestModelFinalCateEstimatorDiscreteMixin, DRLearner): Parameters ---------- - model_propensity : scikit-learn classifier + model_propensity : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' Estimator for Pr[T=t | X, W]. Trained by regressing treatments on (features, controls) concatenated. - Must implement `fit` and `predict_proba` methods. The `fit` method must be able to accept X and T, - where T is a shape (n, ) array. - model_regression : scikit-learn regressor + - If an estimator, will use the model as is for fitting. 
+ - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV + - 'forest' - RandomForestClassifier + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit', 'predict', and 'predict_proba' methods. + + model_regression : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' Estimator for E[Y | X, W, T]. Trained by regressing Y on (features, controls, one-hot-encoded treatments) - concatenated. The one-hot-encoding excludes the baseline treatment. Must implement `fit` and - `predict` methods. If different models per treatment arm are desired, see the - :class:`~econml.utilities.MultiModelWrapper` helper class. + concatenated. The one-hot-encoding excludes the baseline treatment. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. + + binary_outcome: bool, default False + Whether the outcome should be treated as binary min_propensity : float, default ``1e-6`` The minimum propensity at which to clip propensity estimates to avoid dividing by zero.
diff --git a/econml/dynamic/dml/__init__.py b/econml/dynamic/dml/__init__.py index 0185ea702..6d9949296 100755 --- a/econml/dynamic/dml/__init__.py +++ b/econml/dynamic/dml/__init__.py @@ -44,17 +44,35 @@ def DynamicDML(*, Parameters ---------- - model_y: estimator or 'auto', default 'auto' - The estimator for fitting the response to the features. Must implement - `fit` and `predict` methods. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. - - model_t: estimator or 'auto', default 'auto' - The estimator for fitting the treatment to the features. - If estimator, it must implement `fit` and `predict` methods; - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. + model_y: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + Determines how to fit the response to the features. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. + + model_t: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + Determines how to fit the treatment to the features. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword.
+ + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. featurizer : :term:`transformer`, optional Must support fit_transform and transform. Used to create composite features in the final CATE regression. diff --git a/econml/iv/dml/_dml.py b/econml/iv/dml/_dml.py index 21d581edb..cc22cfdbc 100644 --- a/econml/iv/dml/_dml.py +++ b/econml/iv/dml/_dml.py @@ -204,30 +204,65 @@ class OrthoIV(LinearModelFinalCateEstimatorMixin, _OrthoLearner): Parameters ---------- - model_y_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[Y | X, W]`. Must support `fit` and `predict` methods. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. - - model_t_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[T | X, W]`. Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. - - model_t_xwz : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[T | X, W, Z]`. Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. - - model_z_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[Z | X, W]`. 
Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete instrument, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous instrument. + model_y_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + model to estimate :math:`\\E[Y | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. + + model_t_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + model to estimate :math:`\\E[T | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. + + model_t_xwz : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + model to estimate :math:`\\E[T | X, W, Z]`. 
+ + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. + + model_z_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + model to estimate :math:`\\E[Z | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_instrument=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_instrument=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_instrument=True. projection: bool, default False If True, we fit a slight variant of OrthoIV where we use E[T|X, W, Z] as the instrument as opposed to Z, @@ -241,6 +276,9 @@ class OrthoIV(LinearModelFinalCateEstimatorMixin, _OrthoLearner): fit_cate_intercept : bool, default False Whether the linear CATE model should have a constant term. 
+ binary_outcome: bool, default False + Whether the outcome should be treated as binary + discrete_treatment: bool, default False Whether the treatment values should be treated as categorical, rather than continuous, quantities @@ -996,23 +1034,50 @@ class DMLIV(_BaseDMLIV): Parameters ---------- - model_y_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[Y | X, W]`. Must support `fit` and `predict` methods. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. - - model_t_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[T | X, W]`. Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. - - model_t_xwz : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[T | X, W, Z]`. Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. + model_y_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + model to estimate :math:`\\E[Y | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. 
+ - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. + + model_t_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + Model to estimate :math:`\\E[T | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. + + model_t_xwz : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + Model to estimate :math:`\\E[T | X, W, Z]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. 
model_final : estimator (default is :class:`.StatsModelsLinearRegression`) final model that at fit time takes as input :math:`(Y-\\E[Y|X])`, :math:`(\\E[T|X,Z]-\\E[T|X])` and X @@ -1028,6 +1093,9 @@ class DMLIV(_BaseDMLIV): discrete_instrument: bool, default False Whether the instrument values should be treated as categorical, rather than continuous, quantities + binary_outcome: bool, default False + Whether the outcome should be treated as binary + discrete_treatment: bool, default False Whether the treatment values should be treated as categorical, rather than continuous, quantities @@ -1374,25 +1442,50 @@ class NonParamDMLIV(_BaseDMLIV): Parameters ---------- - model_y_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[Y | X, W]`. Must support `fit` and `predict` methods. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. - - model_t_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[T | X, W]`. Must support `fit` and either `predict` or `predict_proba` methods, - depending on whether the treatment is discrete. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. - - model_t_xwz : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[T | X, W, Z]`. Must support `fit` and either `predict` or `predict_proba` - methods, depending on whether the treatment is discrete. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. + model_y_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + model to estimate :math:`\\E[Y | X, W]`. + + - If an estimator, will use the model as is for fitting. 
+ - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. + + model_t_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + Model to estimate :math:`\\E[T | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. + + model_t_xwz : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + Model to estimate :math:`\\E[T | X, W, Z]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. 
+ - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. model_final : estimator final model for predicting :math:`\\tilde{Y}` from X with sample weights V(X) @@ -1401,6 +1494,9 @@ class NonParamDMLIV(_BaseDMLIV): The transformer used to featurize the raw features when fitting the final model. Must implement a `fit_transform` method. + binary_outcome: bool, default False + Whether the outcome should be treated as binary + discrete_treatment: bool, default False Whether the treatment values should be treated as categorical, rather than continuous, quantities diff --git a/econml/iv/dr/_dr.py b/econml/iv/dr/_dr.py index 589f914e0..54ff0c523 100644 --- a/econml/iv/dr/_dr.py +++ b/econml/iv/dr/_dr.py @@ -711,39 +711,83 @@ class DRIV(_DRIV): Parameters ---------- - model_y_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[Y | X, W]`. Must support `fit` and `predict` methods. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. - - model_t_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[T | X, W]`. Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. - - model_z_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[Z | X, W]`. Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete instrument, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous instrument. - - model_t_xwz : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[T | X, W, Z]`. 
Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. - - model_tz_xw : estimator or 'auto' (default is 'auto') + model_y_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + model to estimate :math:`\\E[Y | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. + + model_t_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + Model to estimate :math:`\\E[T | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. 
+ + model_z_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + model to estimate :math:`\\E[Z | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_instrument=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_instrument=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_instrument=True. + + model_t_xwz : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + Model to estimate :math:`\\E[T | X, W, Z]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. + + model_tz_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' model to estimate :math:`\\E[T*Z | X, W]` or :math:`\\E[\\tilde{T}*\\tilde{Z} | X, W]` depending on `fit_cov_directly`. - Must support `fit` and `predict` methods. 
- If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete instrument and discrete treatment with `fit_cov_directly=False`, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied otherwise. + Target will be discrete if discrete instrument and discrete treatment with `fit_cov_directly=False`, + else target will be continuous. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete target else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete target else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete target. fit_cov_directly : bool, default True Whether to fit :math:`\\E[\\tilde{T}*\\tilde{Z} | X, W]` instead of :math:`\\E[T*Z | X, W]`. @@ -790,6 +834,9 @@ class DRIV(_DRIV): it method will return a biased projection to the model_final space, biased to give more weight on parts of the feature space where the instrument is strong. + binary_outcome: bool, default False + Whether the outcome should be treated as binary + discrete_instrument: bool, default False Whether the instrument values should be treated as categorical, rather than continuous, quantities @@ -1197,39 +1244,83 @@ class LinearDRIV(StatsModelsCateEstimatorMixin, DRIV): Parameters ---------- - model_y_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[Y | X, W]`. Must support `fit` and `predict` methods. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. 
- - model_t_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[T | X, W]`. Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. - - model_z_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[Z | X, W]`. Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete instrument, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous instrument. - - model_t_xwz : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[T | X, W, Z]`. Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. - - model_tz_xw : estimator or 'auto' (default is 'auto') + model_y_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + model to estimate :math:`\\E[Y | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. 
+ + model_t_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + model to estimate :math:`\\E[T | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. + + model_z_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + model to estimate :math:`\\E[Z | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_instrument=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_instrument=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_instrument=True. + + model_t_xwz : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + model to estimate :math:`\\E[T | X, W, Z]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. 
+ + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. + + model_tz_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' model to estimate :math:`\\E[T*Z | X, W]` or :math:`\\E[\\tilde{T}*\\tilde{Z} | X, W]` depending on `fit_cov_directly`. - Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete instrument and discrete treatment with `fit_cov_directly=False`, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied otherwise. + Target will be discrete if discrete instrument and discrete treatment with `fit_cov_directly=False`, + else target will be continuous. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete target else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete target else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete target. fit_cov_directly : bool, default True Whether to fit :math:`\\E[\\tilde{T}*\\tilde{Z} | X, W]` instead of :math:`\\E[T*Z | X, W]`. 
@@ -1273,6 +1364,9 @@ class LinearDRIV(StatsModelsCateEstimatorMixin, DRIV): it method will return a biased projection to the model_final space, biased to give more weight on parts of the feature space where the instrument is strong. + binary_outcome: bool, default False + Whether the outcome should be treated as binary + discrete_instrument: bool, default False Whether the instrument values should be treated as categorical, rather than continuous, quantities @@ -1520,39 +1614,83 @@ class SparseLinearDRIV(DebiasedLassoCateEstimatorMixin, DRIV): Parameters ---------- - model_y_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[Y | X, W]`. Must support `fit` and `predict` methods. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. - - model_t_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[T | X, W]`. Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. - - model_z_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[Z | X, W]`. Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete instrument, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous instrument. - - model_t_xwz : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[T | X, W, Z]`. Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. 
- - model_tz_xw : estimator or 'auto' (default is 'auto') + model_y_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + model to estimate :math:`\\E[Y | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. + + model_t_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + model to estimate :math:`\\E[T | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. + + model_z_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + model to estimate :math:`\\E[Z | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. 
+ + - 'linear' - LogisticRegressionCV if discrete_instrument=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_instrument=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_instrument=True. + + model_t_xwz : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + Model to estimate :math:`\\E[T | X, W, Z]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. + + model_tz_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' model to estimate :math:`\\E[T*Z | X, W]` or :math:`\\E[\\tilde{T}*\\tilde{Z} | X, W]` depending on `fit_cov_directly`. - Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete instrument and discrete treatment with `fit_cov_directly=False`, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied otherwise. 
+ Target will be discrete if discrete instrument and discrete treatment with `fit_cov_directly=False`, + else target will be continuous. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete target else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete target else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete target. fit_cov_directly : bool, default True Whether to fit :math:`\\E[\\tilde{T}*\\tilde{Z} | X, W]` instead of :math:`\\E[T*Z | X, W]`. @@ -1626,6 +1764,9 @@ class SparseLinearDRIV(DebiasedLassoCateEstimatorMixin, DRIV): it method will return a biased projection to the model_final space, biased to give more weight on parts of the feature space where the instrument is strong. + binary_outcome: bool, default False + Whether the outcome should be treated as binary + discrete_instrument: bool, default False Whether the instrument values should be treated as categorical, rather than continuous, quantities @@ -1889,39 +2030,83 @@ class ForestDRIV(ForestModelFinalCateEstimatorMixin, DRIV): Parameters ---------- - model_y_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[Y | X, W]`. Must support `fit` and `predict` methods. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. - - model_t_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[T | X, W]`. Must support `fit` and `predict` methods. 
- If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. - - model_z_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[Z | X, W]`. Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete instrument, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous instrument. - - model_t_xwz : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[T | X, W, Z]`. Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. - - model_tz_xw : estimator or 'auto' (default is 'auto') + model_y_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + model to estimate :math:`\\E[Y | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. + + model_t_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + model to estimate :math:`\\E[T | X, W]`. + + - If an estimator, will use the model as is for fitting. 
+ - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. + + model_z_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + model to estimate :math:`\\E[Z | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_instrument=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_instrument=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_instrument=True. + + model_t_xwz : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + model to estimate :math:`\\E[T | X, W, Z]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. 
+ - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. + + model_tz_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' model to estimate :math:`\\E[T*Z | X, W]` or :math:`\\E[\\tilde{T}*\\tilde{Z} | X, W]` depending on `fit_cov_directly`. - Must support `fit` and `predict` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete instrument and discrete treatment with `fit_cov_directly=False`, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied otherwise. + Target will be discrete if discrete instrument and discrete treatment with `fit_cov_directly=False`, + else target will be continuous. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete target else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete target else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete target. fit_cov_directly : bool, default True Whether to fit :math:`\\E[\\tilde{T}*\\tilde{Z} | X, W]` instead of :math:`\\E[T*Z | X, W]`. @@ -2067,6 +2252,9 @@ class ForestDRIV(ForestModelFinalCateEstimatorMixin, DRIV): it method will return a biased projection to the model_final space, biased to give more weight on parts of the feature space where the instrument is strong. 
+ binary_outcome: bool, default False + Whether the outcome should be treated as binary + discrete_instrument: bool, default False Whether the instrument values should be treated as categorical, rather than continuous, quantities @@ -2429,6 +2617,7 @@ def __init__(self, *, z_propensity="auto", featurizer=None, fit_cate_intercept=False, + binary_outcome=False, cov_clip=1e-3, opt_reweighted=False, categories='auto', @@ -2447,6 +2636,7 @@ def __init__(self, *, super().__init__(model_final=model_final, featurizer=featurizer, fit_cate_intercept=fit_cate_intercept, + binary_outcome=binary_outcome, cov_clip=cov_clip, cv=cv, mc_iters=mc_iters, @@ -2504,14 +2694,35 @@ class IntentToTreatDRIV(_IntentToTreatDRIV): Parameters ---------- - model_y_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[Y | X, W]`. Must support `fit` and `predict` methods. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. + model_y_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + model to estimate :math:`\\E[Y | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. - model_t_xwz : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[T | X, W, Z]`. Must support `fit` and `predict_proba` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment. 
+ model_t_xwz : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + model to estimate :math:`\\E[T | X, W, Z]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. flexible_model_effect : estimator or 'auto' (default is 'auto') a flexible model for a preliminary version of the CATE, must accept sample_weight at fit time. @@ -2655,6 +2866,7 @@ def __init__(self, *, z_propensity="auto", featurizer=None, fit_cate_intercept=False, + binary_outcome=True, cov_clip=1e-3, cv=3, mc_iters=None, @@ -2681,6 +2893,7 @@ def __init__(self, *, z_propensity=z_propensity, featurizer=featurizer, fit_cate_intercept=fit_cate_intercept, + binary_outcome=binary_outcome, cov_clip=cov_clip, opt_reweighted=opt_reweighted, categories=categories, @@ -2800,15 +3013,36 @@ class LinearIntentToTreatDRIV(StatsModelsCateEstimatorMixin, IntentToTreatDRIV): Parameters ---------- - model_y_xw : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[Y | X, W]`. Must support `fit` and `predict` methods. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. + model_y_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + model to estimate :math:`\\E[Y | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. 
+ + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. - model_t_xwz : estimator or 'auto' (default is 'auto') - model to estimate :math:`\\E[T | X, W, Z]`. Must support `fit` and `predict_proba` methods. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` - will be applied for discrete treatment. + + model_t_xwz : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' + model to estimate :math:`\\E[T | X, W, Z]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. flexible_model_effect : estimator or 'auto' (default is 'auto') a flexible model for a preliminary version of the CATE, must accept sample_weight at fit time. 
@@ -2960,6 +3194,7 @@ def __init__(self, *, z_propensity="auto", featurizer=None, fit_cate_intercept=True, + binary_outcome=False, cov_clip=1e-3, cv=3, mc_iters=None, @@ -2980,6 +3215,7 @@ def __init__(self, *, z_propensity=z_propensity, featurizer=featurizer, fit_cate_intercept=fit_cate_intercept, + binary_outcome=binary_outcome, cov_clip=cov_clip, cv=cv, mc_iters=mc_iters, diff --git a/econml/panel/dml/_dml.py b/econml/panel/dml/_dml.py index 8235e6422..b85aa43aa 100644 --- a/econml/panel/dml/_dml.py +++ b/econml/panel/dml/_dml.py @@ -344,17 +344,35 @@ class DynamicDML(LinearModelFinalCateEstimatorMixin, _OrthoLearner): Parameters ---------- - model_y: estimator or 'auto', default 'auto' - The estimator for fitting the response to the features. Must implement - `fit` and `predict` methods. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. - - model_t: estimator or 'auto', default 'auto' - The estimator for fitting the treatment to the features. - If estimator, it must implement `fit` and `predict` methods; - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` will be applied for discrete treatment, - and :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` - will be applied for continuous treatment. + model_y: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + model to estimate :math:`\\E[Y | X, W]`. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. 
+ - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if binary_outcome=True. + + model_t: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' + Determines how to fit the treatment to the features. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV if discrete_treatment=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_treatment=True else RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods, + and additionally 'predict_proba' if discrete_treatment=True. featurizer : :term:`transformer`, optional Must support fit_transform and transform. Used to create composite features in the final CATE regression. 
@@ -368,6 +386,9 @@ class DynamicDML(LinearModelFinalCateEstimatorMixin, _OrthoLearner): Whether the first stage models are linear (in which case we will expand the features passed to `model_y` accordingly) + binary_outcome: bool, default False + Whether the outcome should be treated as binary + discrete_treatment: bool, default ``False`` Whether the treatment values should be treated as categorical, rather than continuous, quantities diff --git a/econml/policy/_drlearner.py b/econml/policy/_drlearner.py index 05a50989a..2ee38c158 100644 --- a/econml/policy/_drlearner.py +++ b/econml/policy/_drlearner.py @@ -239,18 +239,34 @@ class takes as input the parameter ``model_regressor``, which is an arbitrary sc Parameters ---------- - model_propensity : scikit-learn classifier or 'auto', default 'auto' + model_propensity : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' Estimator for Pr[T=t | X, W]. Trained by regressing treatments on (features, controls) concatenated. - Must implement `fit` and `predict_proba` methods. The `fit` method must be able to accept X and T, - where T is a shape (n, ) array. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` will be chosen. - model_regression : scikit-learn regressor or 'auto', default 'auto' + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - LogisticRegressionCV + - 'forest' - RandomForestClassifier + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict', and 'predict_proba'. + + model_regression : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' Estimator for E[Y | X, W, T]. 
Trained by regressing Y on (features, controls, one-hot-encoded treatments) - concatenated. The one-hot-encoding excludes the baseline treatment. Must implement `fit` and - `predict` methods. If different models per treatment arm are desired, see the - :class:`.MultiModelWrapper` helper class. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. + concatenated. The one-hot-encoding excludes the baseline treatment. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - WeightedLassoCVWrapper + - 'forest' - RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods. featurizer : :term:`transformer`, optional Must support fit_transform and transform. Used to create composite features in the final CATE regression. @@ -635,18 +651,34 @@ class takes as input the parameter ``model_regressor``, which is an arbitrary sc Parameters ---------- - model_propensity : scikit-learn classifier or 'auto', default 'auto' + model_propensity : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' Estimator for Pr[T=t | X, W]. Trained by regressing treatments on (features, controls) concatenated. - Must implement `fit` and `predict_proba` methods. The `fit` method must be able to accept X and T, - where T is a shape (n, ) array. - If 'auto', :class:`~sklearn.linear_model.LogisticRegressionCV` will be chosen. - model_regression : scikit-learn regressor or 'auto', default 'auto' + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword.
+ + - 'linear' - LogisticRegressionCV + - 'forest' - RandomForestClassifier + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict', and 'predict_proba'. + + model_regression : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' Estimator for E[Y | X, W, T]. Trained by regressing Y on (features, controls, one-hot-encoded treatments) - concatenated. The one-hot-encoding excludes the baseline treatment. Must implement `fit` and - `predict` methods. If different models per treatment arm are desired, see the - :class:`.MultiModelWrapper` helper class. - If 'auto' :class:`.WeightedLassoCV`/:class:`.WeightedMultiTaskLassoCV` will be chosen. + concatenated. The one-hot-encoding excludes the baseline treatment. + + - If an estimator, will use the model as is for fitting. + - If str, will use model associated with the keyword. + + - 'linear' - WeightedLassoCVWrapper + - 'forest' - RandomForestRegressor + - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ + and then use the best estimator for fitting. + - If 'auto', model will select over linear and forest models + + User-supplied estimators should support 'fit' and 'predict' methods. featurizer : :term:`transformer`, optional Must support fit_transform and transform. Used to create composite features in the final CATE regression.
diff --git a/econml/tests/test_binary_outcome.py b/econml/tests/test_binary_outcome.py index ccf42bd24..127c19d7a 100644 --- a/econml/tests/test_binary_outcome.py +++ b/econml/tests/test_binary_outcome.py @@ -11,9 +11,9 @@ from econml._ortho_learner import _OrthoLearner from econml.dml import LinearDML, SparseLinearDML, KernelDML, CausalForestDML, NonParamDML -from econml.dr import LinearDRLearner +from econml.dr import LinearDRLearner, ForestDRLearner from econml.iv.dml import OrthoIV, DMLIV, NonParamDMLIV -from econml.iv.dr import DRIV, LinearDRIV, SparseLinearDRIV, ForestDRIV +from econml.iv.dr import DRIV, LinearDRIV, SparseLinearDRIV, ForestDRIV, IntentToTreatDRIV, LinearIntentToTreatDRIV from econml.orf import DMLOrthoForest from econml.utilities import filter_none_kwargs @@ -119,20 +119,42 @@ def gen_array(n, is_binary, d): if Z is not None: est_list = [ - DRIV(binary_outcome=binary_outcome), - DMLIV(binary_outcome=binary_outcome), - OrthoIV(binary_outcome=binary_outcome), + DRIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, + discrete_instrument=discrete_instrument), + DMLIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, + discrete_instrument=discrete_instrument), + OrthoIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, + discrete_instrument=discrete_instrument), + LinearDRIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, + discrete_instrument=discrete_instrument), + SparseLinearDRIV(binary_outcome=binary_outcome, + discrete_treatment=discrete_treatment, + discrete_instrument=discrete_instrument), + ForestDRIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, + discrete_instrument=discrete_instrument), + OrthoIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, + discrete_instrument=discrete_instrument), + NonParamDMLIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, + 
discrete_instrument=discrete_instrument) ] + if discrete_instrument: + est_list += [ + LinearIntentToTreatDRIV(binary_outcome=binary_outcome), + IntentToTreatDRIV(binary_outcome=binary_outcome), + ] + else: est_list = [ LinearDML(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment), + SparseLinearDML(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment), CausalForestDML(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment) ] if discrete_treatment: est_list += [ LinearDRLearner(binary_outcome=binary_outcome), + ForestDRLearner(binary_outcome=binary_outcome), ] for est in est_list: From 79a3b07173f9673506cb514ce3dc6e11695e37cc Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Fri, 15 Dec 2023 15:45:29 -0500 Subject: [PATCH 16/25] fix default Signed-off-by: Fabio Vera --- econml/iv/dr/_dr.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/econml/iv/dr/_dr.py b/econml/iv/dr/_dr.py index 54ff0c523..abc1d601d 100644 --- a/econml/iv/dr/_dr.py +++ b/econml/iv/dr/_dr.py @@ -2866,7 +2866,7 @@ def __init__(self, *, z_propensity="auto", featurizer=None, fit_cate_intercept=False, - binary_outcome=True, + binary_outcome=False, cov_clip=1e-3, cv=3, mc_iters=None, From 17a0b361e6e6716b71b79e073a423c379d86cfd3 Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Fri, 15 Dec 2023 16:37:23 -0500 Subject: [PATCH 17/25] bugfixes Signed-off-by: Fabio Vera --- econml/_ortho_learner.py | 4 ++-- econml/tests/test_binary_outcome.py | 2 +- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/econml/_ortho_learner.py b/econml/_ortho_learner.py index 3b0d34e98..f5f91b36e 100644 --- a/econml/_ortho_learner.py +++ b/econml/_ortho_learner.py @@ -924,7 +924,7 @@ def _fit_nuisances(self, Y, T, X=None, W=None, Z=None, sample_weight=None, group Z = self.z_transformer.transform(reshape(Z, (-1, 1))) if self.binary_outcome: - Y = self.outcome_transformer.transform(Y).reshape(Y.shape) + Y = 
self.outcome_transformer.transform(Y).reshape(-1, 1) if self.cv == 1: # special case, no cross validation folds = None @@ -1057,7 +1057,7 @@ def score(self, Y, T, X=None, W=None, Z=None, sample_weight=None, groups=None): if self.z_transformer is not None: Z = self.z_transformer.transform(reshape(Z, (-1, 1))) if self.binary_outcome: - Y = self.outcome_transformer.transform(Y).reshape(Y.shape) + Y = self.outcome_transformer.transform(Y).reshape(-1, 1) n_iters = len(self._models_nuisance) n_splits = len(self._models_nuisance[0]) diff --git a/econml/tests/test_binary_outcome.py b/econml/tests/test_binary_outcome.py index 127c19d7a..2547a8e72 100644 --- a/econml/tests/test_binary_outcome.py +++ b/econml/tests/test_binary_outcome.py @@ -135,7 +135,7 @@ def gen_array(n, is_binary, d): OrthoIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, discrete_instrument=discrete_instrument), NonParamDMLIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, - discrete_instrument=discrete_instrument) + discrete_instrument=discrete_instrument, model_final=LinearRegression()) ] if discrete_instrument: From 6ba3b1fe0cf8170b0eae8f2d535971a9f2c3a711 Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Tue, 2 Jan 2024 09:51:37 -0500 Subject: [PATCH 18/25] test_binary_outcome bugfix Signed-off-by: Fabio Vera --- econml/tests/test_binary_outcome.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/econml/tests/test_binary_outcome.py b/econml/tests/test_binary_outcome.py index 2547a8e72..c86eeb3ab 100644 --- a/econml/tests/test_binary_outcome.py +++ b/econml/tests/test_binary_outcome.py @@ -138,7 +138,7 @@ def gen_array(n, is_binary, d): discrete_instrument=discrete_instrument, model_final=LinearRegression()) ] - if discrete_instrument: + if discrete_instrument and discrete_treatment: est_list += [ LinearIntentToTreatDRIV(binary_outcome=binary_outcome), IntentToTreatDRIV(binary_outcome=binary_outcome), From 
5d75de488bc88e8991116f04944889cc206c1d9f Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Tue, 2 Jan 2024 16:30:17 -0500 Subject: [PATCH 19/25] adjust tests Signed-off-by: Fabio Vera --- econml/tests/test_binary_outcome.py | 31 +++++++++++++++-------------- 1 file changed, 16 insertions(+), 15 deletions(-) diff --git a/econml/tests/test_binary_outcome.py b/econml/tests/test_binary_outcome.py index c86eeb3ab..8e935a9a8 100644 --- a/econml/tests/test_binary_outcome.py +++ b/econml/tests/test_binary_outcome.py @@ -134,8 +134,9 @@ def gen_array(n, is_binary, d): discrete_instrument=discrete_instrument), OrthoIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, discrete_instrument=discrete_instrument), - NonParamDMLIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, - discrete_instrument=discrete_instrument, model_final=LinearRegression()) + # uncomment when issue #837 is resolved + # NonParamDMLIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, + # discrete_instrument=discrete_instrument, model_final=LinearRegression()) ] if discrete_instrument and discrete_treatment: @@ -166,16 +167,16 @@ def gen_array(n, is_binary, d): est.marginal_effect(T, X=X) est.ate(X=X) - # make sure the auto outcome model is a classifier - if hasattr(est, 'model_y'): - outcome_model_attr = 'models_y' - elif hasattr(est, 'model_regression'): - outcome_model_attr = 'models_regression' - elif hasattr(est, 'model_y_xw'): - outcome_model_attr = 'models_y_xw' - assert ( - hasattr( - getattr(est, outcome_model_attr)[0][0], - 'predict_proba' - ) - ), 'Auto outcome model is not a classifier!' 
+ # make sure the auto outcome model is a classifier + if hasattr(est, 'model_y'): + outcome_model_attr = 'models_y' + elif hasattr(est, 'model_regression'): + outcome_model_attr = 'models_regression' + elif hasattr(est, 'model_y_xw'): + outcome_model_attr = 'models_y_xw' + assert ( + hasattr( + getattr(est, outcome_model_attr)[0][0], + 'predict_proba' + ) + ), 'Auto outcome model is not a classifier!' From 9e7d70149bf1c0de7fdbe201f6da0afe796a0c35 Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Fri, 5 Jan 2024 13:21:13 -0500 Subject: [PATCH 20/25] address comments; binary_outcome->discrete_outcome, improve warnings Signed-off-by: Fabio Vera --- econml/_ortho_learner.py | 56 ++++--------- econml/dml/_rlearner.py | 8 +- econml/dml/causal_forest.py | 14 ++-- econml/dml/dml.py | 72 ++++++++-------- econml/dr/_drlearner.py | 63 +++++++------- econml/dynamic/dml/__init__.py | 6 +- econml/iv/dml/_dml.py | 42 +++++----- econml/iv/dr/_dr.py | 84 +++++++++---------- econml/panel/dml/_dml.py | 14 ++-- econml/tests/test_bootstrap.py | 14 ++-- ...ry_outcome.py => test_discrete_outcome.py} | 52 ++++++------ econml/tests/test_missing_values.py | 2 +- econml/tests/test_ortho_learner.py | 15 ++-- econml/tests/test_treatment_featurization.py | 2 +- econml/tests/test_utilities.py | 13 ++- econml/utilities.py | 28 ++++++- 16 files changed, 253 insertions(+), 232 deletions(-) rename econml/tests/{test_binary_outcome.py => test_discrete_outcome.py} (72%) diff --git a/econml/_ortho_learner.py b/econml/_ortho_learner.py index f5f91b36e..76a51a374 100644 --- a/econml/_ortho_learner.py +++ b/econml/_ortho_learner.py @@ -43,7 +43,7 @@ class in this module implements the general logic in a very versatile way TreatmentExpansionMixin) from .inference import BootstrapInference from .utilities import (_deprecate_positional, check_input_arrays, - cross_product, filter_none_kwargs, + cross_product, filter_none_kwargs, single_strata_from_discrete_arrays, inverse_onehot, jacify_featurizer, ndim, 
reshape, shape, transpose) from .sklearn_extensions.model_selection import ModelSelector @@ -327,7 +327,7 @@ class _OrthoLearner(TreatmentExpansionMixin, LinearCateEstimator): Parameters ---------- - binary_outcome: bool + discrete_outcome: bool Whether the outcome should be treated as binary discrete_treatment: bool @@ -429,7 +429,7 @@ def _gen_ortho_learner_model_final(self): np.random.seed(123) X = np.random.normal(size=(100, 3)) y = X[:, 0] + X[:, 1] + np.random.normal(0, 0.1, size=(100,)) - est = OrthoLearner(cv=2, binary_outcome=False, discrete_treatment=False, treatment_featurizer=None, + est = OrthoLearner(cv=2, discrete_outcome=False, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, categories='auto', random_state=None) est.fit(y, X[:, 0], W=X[:, 1:]) @@ -487,7 +487,7 @@ def _gen_ortho_learner_model_final(self): import scipy.special T = np.random.binomial(1, scipy.special.expit(W[:, 0])) y = T + W[:, 0] + np.random.normal(0, 0.01, size=(100,)) - est = OrthoLearner(cv=2, binary_outcome=False, discrete_treatment=True, discrete_instrument=False, + est = OrthoLearner(cv=2, discrete_outcome=False, discrete_treatment=True, discrete_instrument=False, treatment_featurizer=None, categories='auto', random_state=None) est.fit(y, T, W=W) @@ -519,7 +519,7 @@ def _gen_ortho_learner_model_final(self): """ def __init__(self, *, - binary_outcome, + discrete_outcome, discrete_treatment, treatment_featurizer, discrete_instrument, @@ -532,7 +532,7 @@ def __init__(self, *, use_ray=False, ray_remote_func_options=None): self.cv = cv - self.binary_outcome = binary_outcome + self.discrete_outcome = discrete_outcome self.discrete_treatment = discrete_treatment self.treatment_featurizer = treatment_featurizer self.discrete_instrument = discrete_instrument @@ -629,40 +629,14 @@ def _strata(self, Y, T, X=None, W=None, Z=None, sample_weight=None, freq_weight=None, sample_var=None, groups=None, cache_values=False, only_final=False, check_input=True): arrs 
= [] - if self.binary_outcome: + if self.discrete_outcome: arrs.append(Y) if self.discrete_treatment: arrs.append(T) if self.discrete_instrument: arrs.append(Z) - return self._single_strata_from_discrete_arrays(arrs) - - """ - Combine multiple discrete arrays into a single array for stratification purposes: - - e.g. if arrs are - [0 1 2 0 1 2 0 1 2 0 1 2], - [0 1 0 1 0 1 0 1 0 1 0 1], - [0 0 0 0 0 0 1 1 1 1 1 1] - then output will be - [0 8 4 6 2 10 1 9 5 7 3 11] - - Every distinct combination of these discrete arrays will have it's own label. - """ - - def _single_strata_from_discrete_arrays(self, arrs): - if not arrs: - return None - - curr_array = np.zeros(shape=arrs[0].ravel().shape, dtype='int') - - for arr in arrs: - enc = LabelEncoder() - temp = enc.fit_transform(arr.ravel()) - curr_array = temp + curr_array * len(enc.classes_) - - return curr_array + return single_strata_from_discrete_arrays(arrs) def _prefit(self, Y, T, *args, only_final=False, **kwargs): @@ -739,15 +713,17 @@ def fit(self, Y, T, *, X=None, W=None, Z=None, sample_weight=None, freq_weight=N if not only_final: - if self.binary_outcome: + if self.discrete_outcome: self.outcome_transformer = LabelEncoder() self.outcome_transformer.fit(Y) if Y.shape[1:] and Y.shape[1] > 1: raise ValueError( - f"Only one outcome variable is supported when binary_outcome=True. Got Y of shape {Y.shape}") + f"Only one outcome variable is supported when discrete_outcome=True. Got Y of shape {Y.shape}") if len(self.outcome_transformer.classes_) > 2: raise AttributeError( - "More than 2 outcome classes detected. This method currently only supports binary outcomes") + f"({self.outcome_transformer.classes_} outcome classes detected. \ + Currently, only 2 outcome classes are allowed when discrete_outcome=True. 
\ + Classes provided include {self.outcome_transformer.classes_[:5]}") else: self.outcome_transformer = None @@ -910,7 +886,7 @@ def refit_final(self, inference=None): def _fit_nuisances(self, Y, T, X=None, W=None, Z=None, sample_weight=None, groups=None): # use a binary array to get stratified split in case of discrete treatment - stratify = self.discrete_treatment or self.discrete_instrument or self.binary_outcome + stratify = self.discrete_treatment or self.discrete_instrument or self.discrete_outcome strata = self._strata(Y, T, X=X, W=W, Z=Z, sample_weight=sample_weight, groups=groups) if strata is None: strata = T # always safe to pass T as second arg to split even if we're not actually stratifying @@ -923,7 +899,7 @@ def _fit_nuisances(self, Y, T, X=None, W=None, Z=None, sample_weight=None, group if self.discrete_instrument: Z = self.z_transformer.transform(reshape(Z, (-1, 1))) - if self.binary_outcome: + if self.discrete_outcome: Y = self.outcome_transformer.transform(Y).reshape(-1, 1) if self.cv == 1: # special case, no cross validation @@ -1056,7 +1032,7 @@ def score(self, Y, T, X=None, W=None, Z=None, sample_weight=None, groups=None): X, T = self._expand_treatments(X, T) if self.z_transformer is not None: Z = self.z_transformer.transform(reshape(Z, (-1, 1))) - if self.binary_outcome: + if self.discrete_outcome: Y = self.outcome_transformer.transform(Y).reshape(-1, 1) n_iters = len(self._models_nuisance) n_splits = len(self._models_nuisance[0]) diff --git a/econml/dml/_rlearner.py b/econml/dml/_rlearner.py index 2120c6e17..b4c346b26 100644 --- a/econml/dml/_rlearner.py +++ b/econml/dml/_rlearner.py @@ -137,7 +137,7 @@ class _RLearner(_OrthoLearner): Parameters ---------- - binary_outcome: bool + discrete_outcome: bool Whether the outcome should be treated as binary discrete_treatment: bool @@ -245,7 +245,7 @@ def _gen_rlearner_model_final(self): np.random.seed(123) X = np.random.normal(size=(1000, 3)) y = X[:, 0] + X[:, 1] + np.random.normal(0, 0.01, 
size=(1000,)) - est = RLearner(cv=2, binary_outcome=False, discrete_treatment=False, + est = RLearner(cv=2, discrete_outcome=False, discrete_treatment=False, treatment_featurizer=None, categories='auto', random_state=None) est.fit(y, X[:, 0], X=np.ones((X.shape[0], 1)), W=X[:, 1:]) @@ -295,7 +295,7 @@ def _gen_rlearner_model_final(self): def __init__(self, *, - binary_outcome, + discrete_outcome, discrete_treatment, treatment_featurizer, categories, @@ -306,7 +306,7 @@ def __init__(self, allow_missing=False, use_ray=False, ray_remote_func_options=None): - super().__init__(binary_outcome=binary_outcome, + super().__init__(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, discrete_instrument=False, # no instrument, so doesn't matter diff --git a/econml/dml/causal_forest.py b/econml/dml/causal_forest.py index 6b8ea1bd2..a3affed39 100644 --- a/econml/dml/causal_forest.py +++ b/econml/dml/causal_forest.py @@ -274,14 +274,14 @@ class CausalForestDML(_BaseDML): - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. - - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. 
model_t: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' Determines how to fit the treatment to the features. str in a sentence @@ -308,7 +308,7 @@ class CausalForestDML(_BaseDML): The final CATE will be trained on the outcome of featurizer.fit_transform(T). If featurizer=None, then CATE is trained on T. - binary_outcome: bool, default ``False`` + discrete_outcome: bool, default ``False`` Whether the outcome should be treated as binary discrete_treatment: bool, default ``False`` @@ -609,7 +609,7 @@ def __init__(self, *, model_t='auto', featurizer=None, treatment_featurizer=None, - binary_outcome=False, + discrete_outcome=False, discrete_treatment=False, categories='auto', cv=2, @@ -666,7 +666,7 @@ def __init__(self, *, self.subforest_size = subforest_size self.n_jobs = n_jobs self.verbose = verbose - super().__init__(binary_outcome=binary_outcome, + super().__init__(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, categories=categories, @@ -691,7 +691,7 @@ def _gen_featurizer(self): return clone(self.featurizer, safe=False) def _gen_model_y(self): - return _make_first_stage_selector(self.model_y, self.binary_outcome, self.random_state) + return _make_first_stage_selector(self.model_y, self.discrete_outcome, self.random_state) def _gen_model_t(self): return _make_first_stage_selector(self.model_t, self.discrete_treatment, self.random_state) diff --git a/econml/dml/dml.py b/econml/dml/dml.py index c4fa78038..8dcab2347 100644 --- a/econml/dml/dml.py +++ b/econml/dml/dml.py @@ -52,8 +52,14 @@ def __init__(self, model, discrete_target): def predict(self, X, W): n_samples = X.shape[0] if X is not None else (W.shape[0] if W is not None else 1) if self._discrete_target: - return self._model.predict_proba(_combine(X, W, n_samples))[:, 1:] + if hasattr(self._model, 'predict_proba'): + return self._model.predict_proba(_combine(X, W, n_samples))[:, 1:] + else: + warn('First 
stage model has discrete target but model is not a classifier!', UserWarning) + return self._model.predict(_combine(X, W, n_samples)) else: + if hasattr(self._model, 'predict_proba'): + raise AttributeError("Cannot use a classifier as a first stage model when the target is continuous!") return self._model.predict(_combine(X, W, n_samples)) def score(self, X, W, Target, sample_weight=None): @@ -354,14 +360,14 @@ class takes as input the parameter `model_t`, which is an arbitrary scikit-learn - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. - - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. model_t: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto Determines how to fit the treatment to the features. 
@@ -399,7 +405,7 @@ class takes as input the parameter `model_t`, which is an arbitrary scikit-learn Whether the first stage models are linear (in which case we will expand the features passed to `model_y` accordingly) - binary_outcome: bool, default ``False`` + discrete_outcome: bool, default ``False`` Whether the outcome should be treated as binary discrete_treatment: bool, default ``False`` @@ -508,7 +514,7 @@ def __init__(self, *, treatment_featurizer=None, fit_cate_intercept=True, linear_first_stages="deprecated", - binary_outcome=False, + discrete_outcome=False, discrete_treatment=False, categories='auto', cv=2, @@ -528,7 +534,7 @@ def __init__(self, *, self.model_y = clone(model_y, safe=False) self.model_t = clone(model_t, safe=False) self.model_final = clone(model_final, safe=False) - super().__init__(binary_outcome=binary_outcome, + super().__init__(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, categories=categories, @@ -547,7 +553,7 @@ def _gen_featurizer(self): return clone(self.featurizer, safe=False) def _gen_model_y(self): - return _make_first_stage_selector(self.model_y, self.binary_outcome, self.random_state) + return _make_first_stage_selector(self.model_y, self.discrete_outcome, self.random_state) def _gen_model_t(self): return _make_first_stage_selector(self.model_t, self.discrete_treatment, self.random_state) @@ -628,14 +634,14 @@ class LinearDML(StatsModelsCateEstimatorMixin, DML): - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. 
- - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. model_t: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' Determines how to fit the treatment to the features. @@ -669,7 +675,7 @@ class LinearDML(StatsModelsCateEstimatorMixin, DML): Whether the first stage models are linear (in which case we will expand the features passed to `model_y` accordingly) - binary_outcome: bool, default ``False`` + discrete_outcome: bool, default ``False`` Whether the outcome should be treated as binary discrete_treatment: bool, default ``False`` @@ -764,7 +770,7 @@ def __init__(self, *, treatment_featurizer=None, fit_cate_intercept=True, linear_first_stages="deprecated", - binary_outcome=False, + discrete_outcome=False, discrete_treatment=False, categories='auto', cv=2, @@ -783,7 +789,7 @@ def __init__(self, *, treatment_featurizer=treatment_featurizer, fit_cate_intercept=fit_cate_intercept, linear_first_stages=linear_first_stages, - binary_outcome=binary_outcome, + discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment, categories=categories, cv=cv, @@ -873,14 +879,14 @@ class SparseLinearDML(DebiasedLassoCateEstimatorMixin, DML): - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. 
- - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. model_t: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' Determines how to fit the treatment to the features. @@ -944,7 +950,7 @@ class SparseLinearDML(DebiasedLassoCateEstimatorMixin, DML): Whether the first stage models are linear (in which case we will expand the features passed to `model_y` accordingly) - binary_outcome: bool, default ``False`` + discrete_outcome: bool, default ``False`` Whether the outcome should be treated as binary discrete_treatment: bool, default ``False`` @@ -1046,7 +1052,7 @@ def __init__(self, *, treatment_featurizer=None, fit_cate_intercept=True, linear_first_stages=True, - binary_outcome=False, + discrete_outcome=False, discrete_treatment=False, categories='auto', cv=2, @@ -1070,7 +1076,7 @@ def __init__(self, *, treatment_featurizer=treatment_featurizer, fit_cate_intercept=fit_cate_intercept, linear_first_stages=linear_first_stages, - binary_outcome=binary_outcome, + discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment, categories=categories, cv=cv, @@ -1176,14 +1182,14 @@ class KernelDML(DML): - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. 
- - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. model_t: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' Determines how to fit the treatment to the features. @@ -1206,7 +1212,7 @@ class KernelDML(DML): bw: float, default 1.0 The bandwidth of the Gaussian used to generate features - binary_outcome: bool, default ``False`` + discrete_outcome: bool, default ``False`` Whether the outcome should be treated as binary discrete_treatment: bool, default ``False`` @@ -1289,7 +1295,7 @@ class KernelDML(DML): """ def __init__(self, model_y='auto', model_t='auto', - binary_outcome=False, + discrete_outcome=False, discrete_treatment=False, treatment_featurizer=None, categories='auto', @@ -1310,7 +1316,7 @@ def __init__(self, model_y='auto', model_t='auto', featurizer=None, treatment_featurizer=treatment_featurizer, fit_cate_intercept=fit_cate_intercept, - binary_outcome=binary_outcome, + discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment, categories=categories, cv=cv, @@ -1401,14 +1407,14 @@ class NonParamDML(_BaseDML): - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. 
- - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. model_t: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' Determines how to fit the treatment to the features. @@ -1431,7 +1437,7 @@ class NonParamDML(_BaseDML): The transformer used to featurize the raw features when fitting the final model. Must implement a `fit_transform` method. 
- binary_outcome: bool, default ``False`` + discrete_outcome: bool, default ``False`` Whether the outcome should be treated as binary discrete_treatment: bool, default ``False`` @@ -1523,7 +1529,7 @@ class NonParamDML(_BaseDML): def __init__(self, *, model_y, model_t, model_final, featurizer=None, - binary_outcome=False, + discrete_outcome=False, discrete_treatment=False, treatment_featurizer=None, categories='auto', @@ -1540,7 +1546,7 @@ def __init__(self, *, self.model_t = clone(model_t, safe=False) self.featurizer = clone(featurizer, safe=False) self.model_final = clone(model_final, safe=False) - super().__init__(binary_outcome=binary_outcome, + super().__init__(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, categories=categories, @@ -1566,7 +1572,7 @@ def _gen_featurizer(self): return clone(self.featurizer, safe=False) def _gen_model_y(self): - return _make_first_stage_selector(self.model_y, is_discrete=self.binary_outcome, + return _make_first_stage_selector(self.model_y, is_discrete=self.discrete_outcome, random_state=self.random_state) def _gen_model_t(self): diff --git a/econml/dr/_drlearner.py b/econml/dr/_drlearner.py index c03f8b7ac..b08883f3b 100644 --- a/econml/dr/_drlearner.py +++ b/econml/dr/_drlearner.py @@ -63,11 +63,11 @@ def __init__(self, model_propensity: SingleModelSelector, model_regression: SingleModelSelector, min_propensity, - binary_outcome): + discrete_outcome): self._model_propensity = model_propensity self._model_regression = model_regression self._min_propensity = min_propensity - self._binary_outcome = binary_outcome + self._discrete_outcome = discrete_outcome def _combine(self, X, W): return np.hstack([arr for arr in [X, W] if arr is not None]) @@ -103,15 +103,18 @@ def predict(self, Y, T, X=None, W=None, *, sample_weight=None, groups=None): n = T.shape[0] Y_pred = np.zeros((T.shape[0], T.shape[1] + 1)) T_counter = np.zeros(T.shape) - if self._binary_outcome and 
hasattr(self._model_regression, 'predict_proba'): + if self._discrete_outcome and hasattr(self._model_regression, 'predict_proba'): Y_pred[:, 0] = self._model_regression.predict_proba(np.hstack([XW, T_counter]))[:, 1].reshape(n) else: + if self._discrete_outcome: + warn("A regressor was passed when discrete_outcome=True. \ + Using a classifier is recommended.", UserWarning) Y_pred[:, 0] = self._model_regression.predict(np.hstack([XW, T_counter])).reshape(n) Y_pred[:, 0] += (Y.reshape(n) - Y_pred[:, 0]) * np.all(T == 0, axis=1) / propensities[:, 0] for t in np.arange(T.shape[1]): T_counter = np.zeros(T.shape) T_counter[:, t] = 1 - if self._binary_outcome and hasattr(self._model_regression, 'predict_proba'): + if self._discrete_outcome and hasattr(self._model_regression, 'predict_proba'): Y_pred[:, t + 1] = self._model_regression.predict_proba(np.hstack([XW, T_counter]))[:, 1].reshape(n) else: Y_pred[:, t + 1] = self._model_regression.predict(np.hstack([XW, T_counter])).reshape(n) @@ -262,14 +265,14 @@ class takes as input the parameter ``model_regressor``, which is an arbitrary sc - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. - - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. 
model_final : estimator for the final cate model. Trained on regressing the doubly robust potential outcomes @@ -285,7 +288,7 @@ class takes as input the parameter ``model_regressor``, which is an arbitrary sc mono-task model and a separate clone of the model is trained for each outcome. Then predict(X) of the t-th clone will be the CATE of the t-th lexicographically ordered treatment compared to the baseline. - binary_outcome: bool, default False + discrete_outcome: bool, default False Whether the outcome should be treated as binary multitask_model_final : bool, default False @@ -445,7 +448,7 @@ def __init__(self, *, model_propensity='auto', model_regression='auto', model_final=StatsModelsLinearRegression(), - binary_outcome=False, + discrete_outcome=False, multitask_model_final=False, featurizer=None, min_propensity=1e-6, @@ -467,7 +470,7 @@ def __init__(self, *, super().__init__(cv=cv, mc_iters=mc_iters, mc_agg=mc_agg, - binary_outcome=binary_outcome, + discrete_outcome=discrete_outcome, discrete_treatment=True, treatment_featurizer=None, # treatment featurization not supported with discrete treatment discrete_instrument=False, # no instrument, so doesn't matter @@ -534,9 +537,9 @@ def _get_inference_options(self): def _gen_ortho_learner_model_nuisance(self): model_propensity = _make_first_stage_selector(self.model_propensity, True, self.random_state) - model_regression = _make_first_stage_selector(self.model_regression, self.binary_outcome, self.random_state) + model_regression = _make_first_stage_selector(self.model_regression, self.discrete_outcome, self.random_state) - return _ModelNuisance(model_propensity, model_regression, self.min_propensity, self.binary_outcome) + return _ModelNuisance(model_propensity, model_regression, self.min_propensity, self.discrete_outcome) def _gen_featurizer(self): return clone(self.featurizer, safe=False) @@ -824,14 +827,14 @@ class LinearDRLearner(StatsModelsCateEstimatorDiscreteMixin, DRLearner): - If an estimator, will use 
the model as is for fitting. - If str, will use model associated with the keyword. - - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. featurizer : :term:`transformer`, optional Must support fit_transform and transform. Used to create composite features in the final CATE regression. @@ -841,7 +844,7 @@ class LinearDRLearner(StatsModelsCateEstimatorDiscreteMixin, DRLearner): fit_cate_intercept : bool, default True Whether the linear CATE model should have a constant term. 
- binary_outcome: bool, default False + discrete_outcome: bool, default False Whether the outcome should be treated as binary min_propensity : float, default ``1e-6`` @@ -945,7 +948,7 @@ def __init__(self, *, model_regression='auto', featurizer=None, fit_cate_intercept=True, - binary_outcome=False, + discrete_outcome=False, min_propensity=1e-6, categories='auto', cv=2, @@ -960,7 +963,7 @@ def __init__(self, *, super().__init__(model_propensity=model_propensity, model_regression=model_regression, model_final=None, - binary_outcome=binary_outcome, + discrete_outcome=discrete_outcome, featurizer=featurizer, multitask_model_final=False, min_propensity=min_propensity, @@ -1109,14 +1112,14 @@ class SparseLinearDRLearner(DebiasedLassoCateEstimatorDiscreteMixin, DRLearner): - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. - - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. featurizer : :term:`transformer`, optional Must support fit_transform and transform. Used to create composite features in the final CATE regression. @@ -1126,7 +1129,7 @@ class SparseLinearDRLearner(DebiasedLassoCateEstimatorDiscreteMixin, DRLearner): fit_cate_intercept : bool, default True Whether the linear CATE model should have a constant term. 
- binary_outcome: bool, default False + discrete_outcome: bool, default False Whether the outcome should be treated as binary alpha: str | float, optional., default 'auto'. @@ -1260,7 +1263,7 @@ def __init__(self, *, model_regression='auto', featurizer=None, fit_cate_intercept=True, - binary_outcome=False, + discrete_outcome=False, alpha='auto', n_alphas=100, alpha_cov='auto', @@ -1289,7 +1292,7 @@ def __init__(self, *, super().__init__(model_propensity=model_propensity, model_regression=model_regression, model_final=None, - binary_outcome=binary_outcome, + discrete_outcome=discrete_outcome, featurizer=featurizer, multitask_model_final=False, min_propensity=min_propensity, @@ -1411,16 +1414,16 @@ class ForestDRLearner(ForestModelFinalCateEstimatorDiscreteMixin, DRLearner): - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. - - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. 
- binary_outcome: bool, default False + discrete_outcome: bool, default False Whether the outcome should be treated as binary min_propensity : float, default ``1e-6`` @@ -1583,7 +1586,7 @@ class ForestDRLearner(ForestModelFinalCateEstimatorDiscreteMixin, DRLearner): def __init__(self, *, model_regression="auto", model_propensity="auto", - binary_outcome=False, + discrete_outcome=False, featurizer=None, min_propensity=1e-6, categories='auto', @@ -1623,7 +1626,7 @@ def __init__(self, *, super().__init__(model_regression=model_regression, model_propensity=model_propensity, model_final=None, - binary_outcome=binary_outcome, + discrete_outcome=discrete_outcome, featurizer=featurizer, multitask_model_final=False, min_propensity=min_propensity, diff --git a/econml/dynamic/dml/__init__.py b/econml/dynamic/dml/__init__.py index 6d9949296..4fef96fd1 100755 --- a/econml/dynamic/dml/__init__.py +++ b/econml/dynamic/dml/__init__.py @@ -50,14 +50,14 @@ def DynamicDML(*, - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. - - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. model_t: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' Determines how to fit the treatment to the features. 
diff --git a/econml/iv/dml/_dml.py b/econml/iv/dml/_dml.py index cc22cfdbc..27e85fe7d 100644 --- a/econml/iv/dml/_dml.py +++ b/econml/iv/dml/_dml.py @@ -210,14 +210,14 @@ class OrthoIV(LinearModelFinalCateEstimatorMixin, _OrthoLearner): - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. - - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. model_t_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' model to estimate :math:`\\E[T | X, W]`. @@ -276,7 +276,7 @@ class OrthoIV(LinearModelFinalCateEstimatorMixin, _OrthoLearner): fit_cate_intercept : bool, default False Whether the linear CATE model should have a constant term. 
- binary_outcome: bool, default False + discrete_outcome: bool, default False Whether the outcome should be treated as binary discrete_treatment: bool, default False @@ -392,7 +392,7 @@ def __init__(self, *, projection=False, featurizer=None, fit_cate_intercept=True, - binary_outcome=False, + discrete_outcome=False, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, @@ -410,7 +410,7 @@ def __init__(self, *, self.featurizer = clone(featurizer, safe=False) self.fit_cate_intercept = fit_cate_intercept - super().__init__(binary_outcome=binary_outcome, + super().__init__(discrete_outcome=discrete_outcome, discrete_instrument=discrete_instrument, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, @@ -435,7 +435,7 @@ def _gen_ortho_learner_model_final(self): def _gen_ortho_learner_model_nuisance(self): model_y = _make_first_stage_selector(self.model_y_xw, - is_discrete=self.binary_outcome, + is_discrete=self.discrete_outcome, random_state=self.random_state) model_t = _make_first_stage_selector(self.model_t_xw, @@ -1040,14 +1040,14 @@ class DMLIV(_BaseDMLIV): - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. - - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. 
model_t_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' Model to estimate :math:`\\E[T | X, W]`. @@ -1093,7 +1093,7 @@ class DMLIV(_BaseDMLIV): discrete_instrument: bool, default False Whether the instrument values should be treated as categorical, rather than continuous, quantities - binary_outcome: bool, default False + discrete_outcome: bool, default False Whether the outcome should be treated as binary discrete_treatment: bool, default False @@ -1198,7 +1198,7 @@ def __init__(self, *, model_final=StatsModelsLinearRegression(fit_intercept=False), featurizer=None, fit_cate_intercept=True, - binary_outcome=False, + discrete_outcome=False, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, @@ -1214,7 +1214,7 @@ def __init__(self, *, self.model_final = clone(model_final, safe=False) self.featurizer = clone(featurizer, safe=False) self.fit_cate_intercept = fit_cate_intercept - super().__init__(binary_outcome=binary_outcome, + super().__init__(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, discrete_instrument=discrete_instrument, @@ -1229,7 +1229,7 @@ def _gen_featurizer(self): return clone(self.featurizer, safe=False) def _gen_model_y_xw(self): - return _make_first_stage_selector(self.model_y_xw, self.binary_outcome, self.random_state) + return _make_first_stage_selector(self.model_y_xw, self.discrete_outcome, self.random_state) def _gen_model_t_xw(self): return _make_first_stage_selector(self.model_t_xw, self.discrete_treatment, self.random_state) @@ -1448,14 +1448,14 @@ class NonParamDMLIV(_BaseDMLIV): - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. 
- - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. model_t_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' Model to estimate :math:`\\E[T | X, W]`. @@ -1494,7 +1494,7 @@ class NonParamDMLIV(_BaseDMLIV): The transformer used to featurize the raw features when fitting the final model. Must implement a `fit_transform` method. 
- binary_outcome: bool, default False + discrete_outcome: bool, default False Whether the outcome should be treated as binary discrete_treatment: bool, default False @@ -1601,7 +1601,7 @@ def __init__(self, *, model_t_xw="auto", model_t_xwz="auto", model_final, - binary_outcome=False, + discrete_outcome=False, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, @@ -1617,7 +1617,7 @@ def __init__(self, *, self.model_t_xwz = clone(model_t_xwz, safe=False) self.model_final = clone(model_final, safe=False) self.featurizer = clone(featurizer, safe=False) - super().__init__(binary_outcome=binary_outcome, + super().__init__(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment, discrete_instrument=discrete_instrument, treatment_featurizer=treatment_featurizer, @@ -1632,7 +1632,7 @@ def _gen_featurizer(self): return clone(self.featurizer, safe=False) def _gen_model_y_xw(self): - return _make_first_stage_selector(self.model_y_xw, self.binary_outcome, self.random_state) + return _make_first_stage_selector(self.model_y_xw, self.discrete_outcome, self.random_state) def _gen_model_t_xw(self): return _make_first_stage_selector(self.model_t_xw, self.discrete_treatment, self.random_state) diff --git a/econml/iv/dr/_dr.py b/econml/iv/dr/_dr.py index abc1d601d..2dceef7c8 100644 --- a/econml/iv/dr/_dr.py +++ b/econml/iv/dr/_dr.py @@ -364,7 +364,7 @@ def __init__(self, *, fit_cate_intercept=False, cov_clip=1e-3, opt_reweighted=False, - binary_outcome=False, + discrete_outcome=False, discrete_instrument=False, discrete_treatment=False, treatment_featurizer=None, @@ -381,7 +381,7 @@ def __init__(self, *, self.fit_cate_intercept = fit_cate_intercept self.cov_clip = cov_clip self.opt_reweighted = opt_reweighted - super().__init__(binary_outcome=binary_outcome, + super().__init__(discrete_outcome=discrete_outcome, discrete_instrument=discrete_instrument, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, @@ 
-625,7 +625,7 @@ def __init__(self, *, fit_cate_intercept=False, cov_clip=1e-3, opt_reweighted=False, - binary_outcome=False, + discrete_outcome=False, discrete_instrument=False, discrete_treatment=False, treatment_featurizer=None, @@ -651,7 +651,7 @@ def __init__(self, *, fit_cate_intercept=fit_cate_intercept, cov_clip=cov_clip, opt_reweighted=opt_reweighted, - binary_outcome=binary_outcome, + discrete_outcome=discrete_outcome, discrete_instrument=discrete_instrument, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, @@ -668,7 +668,7 @@ def _gen_prel_model_effect(self): return clone(self.prel_model_effect, safe=False) def _gen_ortho_learner_model_nuisance(self): - model_y_xw = _make_first_stage_selector(self.model_y_xw, self.binary_outcome, self.random_state) + model_y_xw = _make_first_stage_selector(self.model_y_xw, self.discrete_outcome, self.random_state) model_t_xw = _make_first_stage_selector(self.model_t_xw, self.discrete_treatment, self.random_state) if self.projection: @@ -717,14 +717,14 @@ class DRIV(_DRIV): - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. - - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. 
model_t_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' Model to estimate :math:`\\E[T | X, W]`. @@ -834,7 +834,7 @@ class DRIV(_DRIV): it method will return a biased projection to the model_final space, biased to give more weight on parts of the feature space where the instrument is strong. - binary_outcome: bool, default False + discrete_outcome: bool, default False Whether the outcome should be treated as binary discrete_instrument: bool, default False @@ -954,7 +954,7 @@ def __init__(self, *, fit_cate_intercept=False, cov_clip=1e-3, opt_reweighted=False, - binary_outcome=False, + discrete_outcome=False, discrete_instrument=False, discrete_treatment=False, treatment_featurizer=None, @@ -987,7 +987,7 @@ def __init__(self, *, fit_cate_intercept=fit_cate_intercept, cov_clip=cov_clip, opt_reweighted=opt_reweighted, - binary_outcome=binary_outcome, + discrete_outcome=discrete_outcome, discrete_instrument=discrete_instrument, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, @@ -1250,14 +1250,14 @@ class LinearDRIV(StatsModelsCateEstimatorMixin, DRIV): - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. - - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. 
+ and additionally 'predict_proba' if discrete_outcome=True. model_t_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' model to estimate :math:`\\E[T | X, W]`. @@ -1364,7 +1364,7 @@ class LinearDRIV(StatsModelsCateEstimatorMixin, DRIV): it method will return a biased projection to the model_final space, biased to give more weight on parts of the feature space where the instrument is strong. - binary_outcome: bool, default False + discrete_outcome: bool, default False Whether the outcome should be treated as binary discrete_instrument: bool, default False @@ -1495,7 +1495,7 @@ def __init__(self, *, fit_cate_intercept=True, cov_clip=1e-3, opt_reweighted=False, - binary_outcome=False, + discrete_outcome=False, discrete_instrument=False, discrete_treatment=False, treatment_featurizer=None, @@ -1524,7 +1524,7 @@ def __init__(self, *, fit_cate_intercept=fit_cate_intercept, cov_clip=cov_clip, opt_reweighted=opt_reweighted, - binary_outcome=binary_outcome, + discrete_outcome=discrete_outcome, discrete_instrument=discrete_instrument, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, @@ -1620,14 +1620,14 @@ class SparseLinearDRIV(DebiasedLassoCateEstimatorMixin, DRIV): - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. - - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. 
- If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. model_t_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' model to estimate :math:`\\E[T | X, W]`. @@ -1764,7 +1764,7 @@ class SparseLinearDRIV(DebiasedLassoCateEstimatorMixin, DRIV): it method will return a biased projection to the model_final space, biased to give more weight on parts of the feature space where the instrument is strong. - binary_outcome: bool, default False + discrete_outcome: bool, default False Whether the outcome should be treated as binary discrete_instrument: bool, default False @@ -1902,7 +1902,7 @@ def __init__(self, *, n_jobs=None, cov_clip=1e-3, opt_reweighted=False, - binary_outcome=False, + discrete_outcome=False, discrete_instrument=False, discrete_treatment=False, treatment_featurizer=None, @@ -1937,7 +1937,7 @@ def __init__(self, *, fit_cate_intercept=fit_cate_intercept, cov_clip=cov_clip, opt_reweighted=opt_reweighted, - binary_outcome=binary_outcome, + discrete_outcome=discrete_outcome, discrete_instrument=discrete_instrument, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, @@ -2036,14 +2036,14 @@ class ForestDRIV(ForestModelFinalCateEstimatorMixin, DRIV): - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. 
- - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. model_t_xw : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' model to estimate :math:`\\E[T | X, W]`. @@ -2252,7 +2252,7 @@ class ForestDRIV(ForestModelFinalCateEstimatorMixin, DRIV): it method will return a biased projection to the model_final space, biased to give more weight on parts of the feature space where the instrument is strong. 
- binary_outcome: bool, default False + discrete_outcome: bool, default False Whether the outcome should be treated as binary discrete_instrument: bool, default False @@ -2386,7 +2386,7 @@ def __init__(self, *, verbose=0, cov_clip=1e-3, opt_reweighted=False, - binary_outcome=False, + discrete_outcome=False, discrete_instrument=False, discrete_treatment=False, treatment_featurizer=None, @@ -2427,7 +2427,7 @@ def __init__(self, *, fit_cate_intercept=False, cov_clip=cov_clip, opt_reweighted=opt_reweighted, - binary_outcome=binary_outcome, + discrete_outcome=discrete_outcome, discrete_instrument=discrete_instrument, discrete_treatment=discrete_treatment, treatment_featurizer=treatment_featurizer, @@ -2617,7 +2617,7 @@ def __init__(self, *, z_propensity="auto", featurizer=None, fit_cate_intercept=False, - binary_outcome=False, + discrete_outcome=False, cov_clip=1e-3, opt_reweighted=False, categories='auto', @@ -2636,7 +2636,7 @@ def __init__(self, *, super().__init__(model_final=model_final, featurizer=featurizer, fit_cate_intercept=fit_cate_intercept, - binary_outcome=binary_outcome, + discrete_outcome=discrete_outcome, cov_clip=cov_clip, cv=cv, mc_iters=mc_iters, @@ -2655,7 +2655,7 @@ def _gen_prel_model_effect(self): def _gen_ortho_learner_model_nuisance(self): model_y_xw = _make_first_stage_selector(self.model_y_xw, - is_discrete=self.binary_outcome, + is_discrete=self.discrete_outcome, random_state=self.random_state) model_t_xwz = _make_first_stage_selector(self.model_t_xwz, is_discrete=True, random_state=self.random_state) @@ -2700,14 +2700,14 @@ class IntentToTreatDRIV(_IntentToTreatDRIV): - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. 
- - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. model_t_xwz : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' model to estimate :math:`\\E[T | X, W, Z]`. @@ -2866,7 +2866,7 @@ def __init__(self, *, z_propensity="auto", featurizer=None, fit_cate_intercept=False, - binary_outcome=False, + discrete_outcome=False, cov_clip=1e-3, cv=3, mc_iters=None, @@ -2893,7 +2893,7 @@ def __init__(self, *, z_propensity=z_propensity, featurizer=featurizer, fit_cate_intercept=fit_cate_intercept, - binary_outcome=binary_outcome, + discrete_outcome=discrete_outcome, cov_clip=cov_clip, opt_reweighted=opt_reweighted, categories=categories, @@ -3019,14 +3019,14 @@ class LinearIntentToTreatDRIV(StatsModelsCateEstimatorMixin, IntentToTreatDRIV): - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. 
- - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. model_t_xwz : estimator, {'linear', 'forest'}, list of str/estimator, or 'auto', default 'auto' @@ -3194,7 +3194,7 @@ def __init__(self, *, z_propensity="auto", featurizer=None, fit_cate_intercept=True, - binary_outcome=False, + discrete_outcome=False, cov_clip=1e-3, cv=3, mc_iters=None, @@ -3215,7 +3215,7 @@ def __init__(self, *, z_propensity=z_propensity, featurizer=featurizer, fit_cate_intercept=fit_cate_intercept, - binary_outcome=binary_outcome, + discrete_outcome=discrete_outcome, cov_clip=cov_clip, cv=cv, mc_iters=mc_iters, diff --git a/econml/panel/dml/_dml.py b/econml/panel/dml/_dml.py index b85aa43aa..094a230d4 100644 --- a/econml/panel/dml/_dml.py +++ b/econml/panel/dml/_dml.py @@ -350,14 +350,14 @@ class DynamicDML(LinearModelFinalCateEstimatorMixin, _OrthoLearner): - If an estimator, will use the model as is for fitting. - If str, will use model associated with the keyword. 
- - 'linear' - LogisticRegressionCV if binary_outcome=True else WeightedLassoCVWrapper - - 'forest' - RandomForestClassifier if binary_outcome=True else RandomForestRegressor + - 'linear' - LogisticRegressionCV if discrete_outcome=True else WeightedLassoCVWrapper + - 'forest' - RandomForestClassifier if discrete_outcome=True else RandomForestRegressor - If list, will perform model selection on the supplied list, which can be a mix of str and estimators, \ and then use the best estimator for fitting. - If 'auto', model will select over linear and forest models User-supplied estimators should support 'fit' and 'predict' methods, - and additionally 'predict_proba' if binary_outcome=True. + and additionally 'predict_proba' if discrete_outcome=True. model_t: estimator, {'linear', 'forest'}, list of str/estimator, or 'auto' Determines how to fit the treatment to the features. @@ -386,7 +386,7 @@ class DynamicDML(LinearModelFinalCateEstimatorMixin, _OrthoLearner): Whether the first stage models are linear (in which case we will expand the features passed to `model_y` accordingly) - binary_outcome: bool, default False + discrete_outcome: bool, default False Whether the outcome should be treated as binary discrete_treatment: bool, default ``False`` @@ -489,7 +489,7 @@ def __init__(self, *, featurizer=None, fit_cate_intercept=True, linear_first_stages=False, - binary_outcome=False, + discrete_outcome=False, discrete_treatment=False, categories='auto', cv=2, @@ -502,7 +502,7 @@ def __init__(self, *, self.featurizer = clone(featurizer, safe=False) self.model_y = clone(model_y, safe=False) self.model_t = clone(model_t, safe=False) - super().__init__(binary_outcome=binary_outcome, + super().__init__(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment, treatment_featurizer=None, discrete_instrument=False, @@ -564,7 +564,7 @@ def _gen_featurizer(self): def _gen_model_y(self): return _make_first_stage_selector(self.model_y, - is_discrete=self.binary_outcome, + 
is_discrete=self.discrete_outcome, random_state=self.random_state) def _gen_model_t(self): diff --git a/econml/tests/test_bootstrap.py b/econml/tests/test_bootstrap.py index 3145ef07b..df15f9cdb 100644 --- a/econml/tests/test_bootstrap.py +++ b/econml/tests/test_bootstrap.py @@ -270,8 +270,8 @@ def test_internal_options(self): def test_stratify(self): """Test that we can properly stratify by treatment""" - T = np.array([1, 0, 1, 2, 0, 2]) - Y = np.array([1, 2, 3, 4, 5, 6]) + T = [1, 0, 1, 2, 0, 2] + Y = [1, 2, 3, 4, 5, 6] X = np.array([1, 1, 2, 2, 1, 2]).reshape(-1, 1) est = LinearDML(model_y=LinearRegression(), model_t=LogisticRegression(), discrete_treatment=True) inference = BootstrapInference(n_bootstrap_samples=5, n_jobs=-1, verbose=0) @@ -286,9 +286,9 @@ def test_stratify(self): def test_stratify_orthoiv(self): """Test that we can properly stratify by treatment/instrument pair""" - T = np.array([1, 0, 1, 1, 0, 0, 1, 0]) - Z = np.array([1, 0, 0, 1, 0, 1, 0, 1]) - Y = np.array([1, 2, 3, 4, 5, 6, 7, 8]) + T = [1, 0, 1, 1, 0, 0, 1, 0] + Z = [1, 0, 0, 1, 0, 1, 0, 1] + Y = [1, 2, 3, 4, 5, 6, 7, 8] X = np.array([1, 1, 2, 2, 1, 2, 1, 2]).reshape(-1, 1) est = LinearIntentToTreatDRIV(model_y_xw=LinearRegression(), model_t_xwz=LogisticRegression(), flexible_model_effect=LinearRegression(), cv=2) @@ -297,8 +297,8 @@ def test_stratify_orthoiv(self): est.const_marginal_effect_interval(X) def test_all_kinds(self): - T = np.array([1, 0, 1, 2, 0, 2] * 5) - Y = np.array([1, 2, 3, 4, 5, 6] * 5) + T = [1, 0, 1, 2, 0, 2] * 5 + Y = [1, 2, 3, 4, 5, 6] * 5 X = np.array([1, 1, 2, 2, 1, 2] * 5).reshape(-1, 1) est = LinearDML(cv=2) for kind in ['percentile', 'pivot', 'normal']: diff --git a/econml/tests/test_binary_outcome.py b/econml/tests/test_discrete_outcome.py similarity index 72% rename from econml/tests/test_binary_outcome.py rename to econml/tests/test_discrete_outcome.py index 8e935a9a8..b8e650478 100644 --- a/econml/tests/test_binary_outcome.py +++ 
b/econml/tests/test_discrete_outcome.py @@ -20,11 +20,11 @@ from copy import deepcopy -class TestBinaryOutcome(unittest.TestCase): +class TestDiscreteOutcome(unittest.TestCase): # accuracy test def test_accuracy(self): n = 1000 - binary_outcome = True + discrete_outcome = True discrete_treatment = True true_ate = 0.3 W = np.random.uniform(-1, 1, size=(n, 1)) @@ -32,9 +32,9 @@ def test_accuracy(self): Y = np.random.binomial(1, .5 + true_ate * D + .1 * W[:, 0], size=(n,)) ests = [ - LinearDML(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment), - CausalForestDML(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment), - LinearDRLearner(binary_outcome=binary_outcome) + LinearDML(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment), + CausalForestDML(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment), + LinearDRLearner(discrete_outcome=discrete_outcome) ] for est in ests: @@ -60,7 +60,7 @@ def test_accuracy(self): # accuracy test, DML def test_accuracy_iv(self): n = 10000 - binary_outcome = True + discrete_outcome = True discrete_treatment = True true_ate = 0.3 W = np.random.uniform(-1, 1, size=(n, 1)) @@ -69,8 +69,8 @@ def test_accuracy_iv(self): Y = np.random.binomial(1, .5 + true_ate * D + .1 * W[:, 0], size=(n,)) ests = [ - OrthoIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment), - LinearDRIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment), + OrthoIV(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment), + LinearDRIV(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment), ] for est in ests: @@ -91,12 +91,12 @@ def test_string_outcome(self): D = np.random.binomial(1, .5 + .1 * W[:, 0], size=(n,)) Y = np.random.binomial(1, .5 + true_ate * D + .1 * W[:, 0], size=(n,)) Y_str = pd.Series(Y).replace(0, 'a').replace(1, 'b').values - est = LinearDML(binary_outcome=True, discrete_treatment=True) + est = 
LinearDML(discrete_outcome=True, discrete_treatment=True) est.fit(Y_str, D, X=W) def test_basic_functionality(self): n = 100 - binary_outcome = True + discrete_outcome = True d_x = 3 def gen_array(n, is_binary, d): @@ -110,7 +110,7 @@ def gen_array(n, is_binary, d): for discrete_treatment in [True, False]: for discrete_instrument in [True, False, None]: - Y = gen_array(n, binary_outcome, d=0) + Y = gen_array(n, discrete_outcome, d=0) T = gen_array(n, discrete_treatment, d=0) Z = None if discrete_instrument is not None: @@ -119,43 +119,43 @@ def gen_array(n, is_binary, d): if Z is not None: est_list = [ - DRIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, + DRIV(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment, discrete_instrument=discrete_instrument), - DMLIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, + DMLIV(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment, discrete_instrument=discrete_instrument), - OrthoIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, + OrthoIV(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment, discrete_instrument=discrete_instrument), - LinearDRIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, + LinearDRIV(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment, discrete_instrument=discrete_instrument), - SparseLinearDRIV(binary_outcome=binary_outcome, + SparseLinearDRIV(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment, discrete_instrument=discrete_instrument), - ForestDRIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, + ForestDRIV(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment, discrete_instrument=discrete_instrument), - OrthoIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, + OrthoIV(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment, 
discrete_instrument=discrete_instrument), # uncomment when issue #837 is resolved - # NonParamDMLIV(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment, + # NonParamDMLIV(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment, # discrete_instrument=discrete_instrument, model_final=LinearRegression()) ] if discrete_instrument and discrete_treatment: est_list += [ - LinearIntentToTreatDRIV(binary_outcome=binary_outcome), - IntentToTreatDRIV(binary_outcome=binary_outcome), + LinearIntentToTreatDRIV(discrete_outcome=discrete_outcome), + IntentToTreatDRIV(discrete_outcome=discrete_outcome), ] else: est_list = [ - LinearDML(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment), - SparseLinearDML(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment), - CausalForestDML(binary_outcome=binary_outcome, discrete_treatment=discrete_treatment) + LinearDML(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment), + SparseLinearDML(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment), + CausalForestDML(discrete_outcome=discrete_outcome, discrete_treatment=discrete_treatment) ] if discrete_treatment: est_list += [ - LinearDRLearner(binary_outcome=binary_outcome), - ForestDRLearner(binary_outcome=binary_outcome), + LinearDRLearner(discrete_outcome=discrete_outcome), + ForestDRLearner(discrete_outcome=discrete_outcome), ] for est in est_list: diff --git a/econml/tests/test_missing_values.py b/econml/tests/test_missing_values.py index e8542001f..761da5dbc 100644 --- a/econml/tests/test_missing_values.py +++ b/econml/tests/test_missing_values.py @@ -123,7 +123,7 @@ def test_missing(self): # model that can handle missing values nuisance_model = make_pipeline(SimpleImputer(strategy='mean'), LinearRegression()) - OrthoLearner(binary_outcome=False, discrete_treatment=False, treatment_featurizer=None, + OrthoLearner(discrete_outcome=False, discrete_treatment=False, 
treatment_featurizer=None, discrete_instrument=None, categories='auto', cv=3, random_state=1, allow_missing=True).fit(y, T, W=W_missing) diff --git a/econml/tests/test_ortho_learner.py b/econml/tests/test_ortho_learner.py index 84017172a..08cc306ef 100644 --- a/econml/tests/test_ortho_learner.py +++ b/econml/tests/test_ortho_learner.py @@ -2,7 +2,6 @@ # Licensed under the MIT License. from sklearn.datasets import make_regression - from econml._ortho_learner import _OrthoLearner, _crossfit from sklearn.linear_model import LinearRegression from sklearn.preprocessing import PolynomialFeatures @@ -256,7 +255,7 @@ def _gen_ortho_learner_model_final(self): sigma = 0.1 y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) - est = OrthoLearner(cv=2, binary_outcome=False, discrete_treatment=False, treatment_featurizer=None, + est = OrthoLearner(cv=2, discrete_outcome=False, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, categories='auto', random_state=None, use_ray=use_ray) est.fit(y, X[:, 0], W=X[:, 1:]) np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=3) @@ -273,7 +272,7 @@ def _gen_ortho_learner_model_final(self): X = np.random.normal(size=(10000, 3)) sigma = 0.1 y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) - est = OrthoLearner(cv=2, binary_outcome=False, discrete_treatment=False, treatment_featurizer=None, + est = OrthoLearner(cv=2, discrete_outcome=False, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, categories='auto', random_state=None, use_ray=use_ray) # test non-array inputs est.fit(list(y), list(X[:, 0]), X=None, W=X[:, 1:]) @@ -289,7 +288,7 @@ def _gen_ortho_learner_model_final(self): X = np.random.normal(size=(10000, 3)) sigma = 0.1 y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) - est = OrthoLearner(cv=KFold(n_splits=3), binary_outcome=False, + est = OrthoLearner(cv=KFold(n_splits=3), discrete_outcome=False, 
discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, categories='auto', random_state=None, use_ray=use_ray) est.fit(y, X[:, 0], X=None, W=X[:, 1:]) @@ -306,7 +305,7 @@ def _gen_ortho_learner_model_final(self): sigma = 0.1 y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) folds = [(np.arange(X.shape[0] // 2), np.arange(X.shape[0] // 2, X.shape[0]))] - est = OrthoLearner(cv=KFold(n_splits=3), binary_outcome=False, + est = OrthoLearner(cv=KFold(n_splits=3), discrete_outcome=False, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, categories='auto', random_state=None, use_ray=use_ray) @@ -363,7 +362,7 @@ def _gen_ortho_learner_model_final(self): X = np.random.normal(size=(10000, 3)) sigma = 0.1 y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) - est = OrthoLearner(cv=2, binary_outcome=False, discrete_treatment=False, + est = OrthoLearner(cv=2, discrete_outcome=False, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, categories='auto', random_state=None) est.fit(y, X[:, 0], W=X[:, 1:]) @@ -414,7 +413,7 @@ def _gen_ortho_learner_model_final(self): X = np.random.normal(size=(10000, 3)) sigma = 0.1 y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) - est = OrthoLearner(cv=2, binary_outcome=False, discrete_treatment=False, + est = OrthoLearner(cv=2, discrete_outcome=False, discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, categories='auto', random_state=None) est.fit(y, X[:, 0], W=X[:, 1:]) @@ -477,7 +476,7 @@ def _gen_ortho_learner_model_final(self): T = np.random.binomial(1, scipy.special.expit(X[:, 0])) sigma = 0.01 y = T + X[:, 0] + np.random.normal(0, sigma, size=(10000,)) - est = OrthoLearner(cv=2, binary_outcome=False, discrete_treatment=True, + est = OrthoLearner(cv=2, discrete_outcome=False, discrete_treatment=True, treatment_featurizer=None, discrete_instrument=False, categories='auto', 
random_state=None) est.fit(y, T, W=X) diff --git a/econml/tests/test_treatment_featurization.py b/econml/tests/test_treatment_featurization.py index 96f496103..1127e3284 100644 --- a/econml/tests/test_treatment_featurization.py +++ b/econml/tests/test_treatment_featurization.py @@ -525,7 +525,7 @@ def _gen_ortho_learner_model_final(self): 'estimator': OrthoLearner, 'params': { 'cv': 2, - 'binary_outcome': False, + 'discrete_outcome': False, 'discrete_treatment': False, 'treatment_featurizer': None, 'discrete_instrument': False, diff --git a/econml/tests/test_utilities.py b/econml/tests/test_utilities.py index 62bb9ba7c..b80fb2c8b 100644 --- a/econml/tests/test_utilities.py +++ b/econml/tests/test_utilities.py @@ -9,7 +9,8 @@ import sparse as sp import pytest from econml.utilities import (einsum_sparse, todense, tocoo, transpose, - inverse_onehot, cross_product, transpose_dictionary, deprecated, _deprecate_positional) + inverse_onehot, cross_product, transpose_dictionary, deprecated, _deprecate_positional, + single_strata_from_discrete_arrays) from sklearn.preprocessing import OneHotEncoder @@ -177,3 +178,13 @@ def m(a, b, c=1, *args, **kwargs): m(a=1, b=2) m(1, b=2, c=3, X='other') assert not counter + + def test_single_strata_from_discrete_array(self): + T = np.repeat([[0, 1, 2]], 4, axis=0).ravel() + Z = np.repeat([[0, 1]], 6, axis=0).ravel() + Y = np.repeat([0, 1], 6, axis=0) + + assert set(single_strata_from_discrete_arrays([T, Z, Y])) == set(np.arange(12)) + assert set(single_strata_from_discrete_arrays([T, Z])) == set(np.arange(6)) + assert set(single_strata_from_discrete_arrays([T])) == set(np.arange(3)) + assert single_strata_from_discrete_arrays([]) is None diff --git a/econml/utilities.py b/econml/utilities.py index f62ffbb4d..db3f4cb49 100644 --- a/econml/utilities.py +++ b/econml/utilities.py @@ -18,7 +18,7 @@ from functools import reduce, wraps from sklearn.utils import check_array, check_X_y from sklearn.utils.validation import assert_all_finite -from 
sklearn.preprocessing import PolynomialFeatures +from sklearn.preprocessing import PolynomialFeatures, LabelEncoder import warnings from warnings import warn from collections.abc import Iterable @@ -1482,3 +1482,29 @@ def jacify_featurizer(featurizer): a function for calculating the jacobian """ return _TransformerWrapper(featurizer) + + +def single_strata_from_discrete_arrays(arrs): + """ + Combine multiple discrete arrays into a single array for stratification purposes: + + e.g. if arrs are + [0 1 2 0 1 2 0 1 2 0 1 2], + [0 1 0 1 0 1 0 1 0 1 0 1], + [0 0 0 0 0 0 1 1 1 1 1 1] + then output will be + [0 6 8 2 4 10 1 7 9 3 5 11] + + Every distinct combination of these discrete arrays will have its own label. + """ + if not arrs: + return None + + curr_array = np.zeros(shape=np.ravel(arrs[0]).shape, dtype='int') + + for arr in arrs: + enc = LabelEncoder() + temp = enc.fit_transform(np.ravel(arr)) + curr_array = temp + curr_array * len(enc.classes_) + + return curr_array From 0757d39ca06aad3948a320b04e8a365b09626e3e Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Fri, 5 Jan 2024 14:07:29 -0500 Subject: [PATCH 21/25] line endings Signed-off-by: Fabio Vera --- econml/tests/test_ortho_learner.py | 972 ++++++++++++++--------------- 1 file changed, 486 insertions(+), 486 deletions(-) diff --git a/econml/tests/test_ortho_learner.py b/econml/tests/test_ortho_learner.py index 08cc306ef..0c65358ea 100644 --- a/econml/tests/test_ortho_learner.py +++ b/econml/tests/test_ortho_learner.py @@ -1,486 +1,486 @@ -# Copyright (c) PyWhy contributors. All rights reserved. -# Licensed under the MIT License. 
- -from sklearn.datasets import make_regression -from econml._ortho_learner import _OrthoLearner, _crossfit -from sklearn.linear_model import LinearRegression -from sklearn.preprocessing import PolynomialFeatures -from sklearn.linear_model import LinearRegression, LassoCV, Lasso -from sklearn.model_selection import KFold -import numpy as np -import unittest -import joblib -import pytest - -try: - import ray - - ray_installed = True -except ImportError: - ray_installed = False - - -class TestOrthoLearner(unittest.TestCase): - - def _test_crossfit(self, use_ray): - class Wrapper: - - def __init__(self, model): - self._model = model - - def train(self, is_selecting, X, y, Q, W=None): - self._model.fit(X, y) - return self - - def predict(self, X, y, Q, W=None): - return self._model.predict(X), y - self._model.predict(X), X - - def score(self, X, y, Q, W=None): - return self._model.score(X, y) - - np.random.seed(123) - X = np.random.normal(size=(5000, 3)) - y = X[:, 0] + np.random.normal(size=(5000,)) - folds = list(KFold(2).split(X, y)) - model = Lasso(alpha=0.01) - ray_remote_function_option = {"num_cpus": 1} - - nuisance, model_list, fitted_inds, scores = _crossfit(Wrapper(model), folds, use_ray, - ray_remote_function_option, - X, y, y, Z=None) - np.testing.assert_allclose(nuisance[0][folds[0][1]], - model.fit(X[folds[0][0]], y[folds[0][0]]).predict(X[folds[0][1]])) - np.testing.assert_allclose(nuisance[0][folds[0][0]], - model.fit(X[folds[0][1]], y[folds[0][1]]).predict(X[folds[0][0]])) - np.testing.assert_allclose(scores[0][0], model.fit(X[folds[0][0]], y[folds[0][0]]).score(X[folds[0][1]], - y[folds[0][1]])) - np.testing.assert_allclose(scores[0][1], model.fit(X[folds[0][1]], y[folds[0][1]]).score(X[folds[0][0]], - y[folds[0][0]])) - coef_ = np.zeros(X.shape[1]) - coef_[0] = 1 - [np.testing.assert_allclose(coef_, mdl._model.coef_, rtol=0, atol=0.08) for mdl in model_list] - np.testing.assert_array_equal(fitted_inds, np.arange(X.shape[0])) - - np.random.seed(123) - 
X = np.random.normal(size=(5000, 3)) - y = X[:, 0] + np.random.normal(size=(5000,)) - folds = list(KFold(2).split(X, y)) - model = Lasso(alpha=0.01) - nuisance, model_list, fitted_inds, scores = _crossfit(Wrapper(model), folds, use_ray, - ray_remote_function_option, - X, y, y, Z=None) - np.testing.assert_allclose(nuisance[0][folds[0][1]], - model.fit(X[folds[0][0]], y[folds[0][0]]).predict(X[folds[0][1]])) - np.testing.assert_allclose(nuisance[0][folds[0][0]], - model.fit(X[folds[0][1]], y[folds[0][1]]).predict(X[folds[0][0]])) - np.testing.assert_allclose(scores[0][0], model.fit(X[folds[0][0]], y[folds[0][0]]).score(X[folds[0][1]], - y[folds[0][1]])) - np.testing.assert_allclose(scores[0][1], model.fit(X[folds[0][1]], y[folds[0][1]]).score(X[folds[0][0]], - y[folds[0][0]])) - coef_ = np.zeros(X.shape[1]) - coef_[0] = 1 - [np.testing.assert_allclose(coef_, mdl._model.coef_, rtol=0, atol=0.08) for mdl in model_list] - np.testing.assert_array_equal(fitted_inds, np.arange(X.shape[0])) - - np.random.seed(123) - X = np.random.normal(size=(5000, 3)) - y = X[:, 0] + np.random.normal(size=(5000,)) - folds = list(KFold(2).split(X, y)) - model = Lasso(alpha=0.01) - nuisance, model_list, fitted_inds, scores = _crossfit(Wrapper(model), folds, use_ray, - ray_remote_function_option, - X, y, y, Z=None) - np.testing.assert_allclose(nuisance[0][folds[0][1]], - model.fit(X[folds[0][0]], y[folds[0][0]]).predict(X[folds[0][1]])) - np.testing.assert_allclose(nuisance[0][folds[0][0]], - model.fit(X[folds[0][1]], y[folds[0][1]]).predict(X[folds[0][0]])) - np.testing.assert_allclose(scores[0][0], model.fit(X[folds[0][0]], y[folds[0][0]]).score(X[folds[0][1]], - y[folds[0][1]])) - np.testing.assert_allclose(scores[0][1], model.fit(X[folds[0][1]], y[folds[0][1]]).score(X[folds[0][0]], - y[folds[0][0]])) - coef_ = np.zeros(X.shape[1]) - coef_[0] = 1 - [np.testing.assert_allclose(coef_, mdl._model.coef_, rtol=0, atol=0.08) for mdl in model_list] - np.testing.assert_array_equal(fitted_inds, 
np.arange(X.shape[0])) - - class Wrapper: - - def __init__(self, model): - self._model = model - - def train(self, is_selecting, X, y, W=None): - self._model.fit(X, y) - return self - - def predict(self, X, y, W=None): - return self._model.predict(X), y - self._model.predict(X), X - - np.random.seed(123) - X = np.random.normal(size=(5000, 3)) - y = X[:, 0] + np.random.normal(size=(5000,)) - folds = [(np.arange(X.shape[0] // 2), np.arange(X.shape[0] // 2, X.shape[0])), - (np.arange(X.shape[0] // 2), np.arange(X.shape[0] // 2, X.shape[0]))] - model = Lasso(alpha=0.01) - with pytest.raises(AttributeError) as e_info: - nuisance, model_list, fitted_inds, scores = _crossfit(Wrapper(model), folds, use_ray, - ray_remote_function_option, - X, y, y, Z=None) - - np.random.seed(123) - X = np.random.normal(size=(5000, 3)) - y = X[:, 0] + np.random.normal(size=(5000,)) - folds = [(np.arange(X.shape[0] // 2), np.arange(X.shape[0] // 2, X.shape[0])), - (np.arange(X.shape[0] // 2), np.arange(X.shape[0] // 2, X.shape[0]))] - model = Lasso(alpha=0.01) - with pytest.raises(AttributeError) as e_info: - nuisance, model_list, fitted_inds, scores = _crossfit(Wrapper(model), folds, use_ray, - ray_remote_function_option, - X, y, y, Z=None) - - np.random.seed(123) - X = np.random.normal(size=(5000, 3)) - y = X[:, 0] + np.random.normal(size=(5000,)) - folds = [(np.arange(X.shape[0]), np.arange(X.shape[0]))] - model = Lasso(alpha=0.01) - with pytest.raises(AttributeError) as e_info: - nuisance, model_list, fitted_inds, scores = _crossfit(Wrapper(model), folds, use_ray, - ray_remote_function_option, - X, y, y, Z=None) - - np.random.seed(123) - X = np.random.normal(size=(5000, 3)) - y = X[:, 0] + np.random.normal(size=(5000,)) - folds = [(np.arange(X.shape[0]), np.arange(X.shape[0]))] - model = Lasso(alpha=0.01) - with pytest.raises(AttributeError) as e_info: - nuisance, model_list, fitted_inds, scores = _crossfit(Wrapper(model), folds, use_ray, - ray_remote_function_option, - X, y, y, Z=None) - 
- @pytest.mark.ray - def test_crossfit_with_ray(self): - try: - ray.init() - self._test_crossfit(use_ray=True) - finally: - ray.shutdown() - - def test_crossfit_without_ray(self): - self._test_crossfit(use_ray=False) - - @pytest.mark.ray - def test_crossfit_comparison(self): - try: - ray.init() # Initialize Ray - - class Wrapper: - - def __init__(self, model): - self._model = model - - def train(self, is_selecting, X, y, Q, W=None): - self._model.fit(X, y) - return self - - def predict(self, X, y, Q, W=None): - return self._model.predict(X), y - self._model.predict(X), X - - def score(self, X, y, Q, W=None): - return self._model.score(X, y) - - # Generate synthetic data - X, y = make_regression(n_samples=10, n_features=5, noise=0.1, random_state=42) - folds = list(KFold(2).split(X, y)) - model = LinearRegression() - ray_remote_function_option = {"num_cpus": 1} - - # Run _crossfit with Ray enabled - nuisance_ray, model_list_ray, fitted_inds_ray, scores_ray = _crossfit(Wrapper(model), folds, True, - ray_remote_function_option, - X, y, y, Z=None) - # Run _crossfit without Ray - nuisance_regular, model_list_regular, fitted_inds_regular, scores_regular = _crossfit(Wrapper(model), - folds, - False, {}, - X, y, y, Z=None) - # Compare the results - assert np.allclose(nuisance_ray[0], nuisance_regular[0]) - assert np.allclose(nuisance_ray[1], nuisance_regular[1]) - assert np.allclose(fitted_inds_ray, fitted_inds_regular) - assert np.allclose(scores_ray, scores_regular) - - finally: - ray.shutdown() # Shutdown Ray - - def _test_ol(self, use_ray): - class ModelNuisance: - def __init__(self, model_t, model_y): - self._model_t = model_t - self._model_y = model_y - - def train(self, is_selecting, Y, T, W=None): - self._model_t.fit(W, T) - self._model_y.fit(W, Y) - return self - - def predict(self, Y, T, W=None): - return Y - self._model_y.predict(W), T - self._model_t.predict(W) - - class ModelFinal: - - def __init__(self): - return - - def fit(self, Y, T, W=None, 
nuisances=None): - Y_res, T_res = nuisances - self.model = LinearRegression(fit_intercept=False).fit(T_res.reshape(-1, 1), Y_res) - return self - - def predict(self, X=None): - return self.model.coef_[0] - - def score(self, Y, T, W=None, nuisances=None): - Y_res, T_res = nuisances - return np.mean((Y_res - self.model.predict(T_res.reshape(-1, 1))) ** 2) - - class OrthoLearner(_OrthoLearner): - def _gen_ortho_learner_model_nuisance(self): - return ModelNuisance(LinearRegression(), LinearRegression()) - - def _gen_ortho_learner_model_final(self): - return ModelFinal() - - np.random.seed(123) - X = np.random.normal(size=(10000, 3)) - sigma = 0.1 - y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) - - est = OrthoLearner(cv=2, discrete_outcome=False, discrete_treatment=False, treatment_featurizer=None, - discrete_instrument=False, categories='auto', random_state=None, use_ray=use_ray) - est.fit(y, X[:, 0], W=X[:, 1:]) - np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=3) - np.testing.assert_array_almost_equal(est.effect(), np.ones(1), decimal=3) - np.testing.assert_array_almost_equal(est.effect(T0=0, T1=10), np.ones(1) * 10, decimal=2) - np.testing.assert_almost_equal(est.score(y, X[:, 0], W=X[:, 1:]), sigma**2, decimal=3) - np.testing.assert_almost_equal(est.score_, sigma**2, decimal=3) - np.testing.assert_almost_equal(est.ortho_learner_model_final_.model.coef_[0], 1, decimal=3) - # Nuisance model has no score method, so nuisance_scores_ should be none - assert est.nuisance_scores_ is None - - # Test non keyword based calls to fit - np.random.seed(123) - X = np.random.normal(size=(10000, 3)) - sigma = 0.1 - y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) - est = OrthoLearner(cv=2, discrete_outcome=False, discrete_treatment=False, treatment_featurizer=None, - discrete_instrument=False, categories='auto', random_state=None, use_ray=use_ray) - # test non-array inputs - est.fit(list(y), list(X[:, 0]), X=None, W=X[:, 
1:]) - np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=3) - np.testing.assert_array_almost_equal(est.effect(), np.ones(1), decimal=3) - np.testing.assert_array_almost_equal(est.effect(T0=0, T1=10), np.ones(1) * 10, decimal=2) - np.testing.assert_almost_equal(est.score(y, X[:, 0], None, X[:, 1:]), sigma ** 2, decimal=3) - np.testing.assert_almost_equal(est.score_, sigma ** 2, decimal=3) - np.testing.assert_almost_equal(est.ortho_learner_model_final_.model.coef_[0], 1, decimal=3) - - # Test custom splitter - np.random.seed(123) - X = np.random.normal(size=(10000, 3)) - sigma = 0.1 - y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) - est = OrthoLearner(cv=KFold(n_splits=3), discrete_outcome=False, - discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, - categories='auto', random_state=None, use_ray=use_ray) - est.fit(y, X[:, 0], X=None, W=X[:, 1:]) - np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=3) - np.testing.assert_array_almost_equal(est.effect(), np.ones(1), decimal=3) - np.testing.assert_array_almost_equal(est.effect(T0=0, T1=10), np.ones(1) * 10, decimal=2) - np.testing.assert_almost_equal(est.score(y, X[:, 0], W=X[:, 1:]), sigma**2, decimal=3) - np.testing.assert_almost_equal(est.score_, sigma**2, decimal=3) - np.testing.assert_almost_equal(est.ortho_learner_model_final_.model.coef_[0], 1, decimal=3) - - # Test incomplete set of test folds - np.random.seed(123) - X = np.random.normal(size=(10000, 3)) - sigma = 0.1 - y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) - folds = [(np.arange(X.shape[0] // 2), np.arange(X.shape[0] // 2, X.shape[0]))] - est = OrthoLearner(cv=KFold(n_splits=3), discrete_outcome=False, - discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, - categories='auto', random_state=None, use_ray=use_ray) - - est.fit(y, X[:, 0], X=None, W=X[:, 1:]) - np.testing.assert_almost_equal(est.const_marginal_effect(), 1, 
decimal=2) - np.testing.assert_array_almost_equal(est.effect(), np.ones(1), decimal=2) - np.testing.assert_array_almost_equal(est.effect(T0=0, T1=10), np.ones(1) * 10, decimal=1) - np.testing.assert_almost_equal(est.score(y, X[:, 0], W=X[:, 1:]), sigma**2, decimal=2) - np.testing.assert_almost_equal(est.score_, sigma**2, decimal=2) - np.testing.assert_almost_equal(est.ortho_learner_model_final_.model.coef_[0], 1, decimal=2) - - @pytest.mark.ray - def test_ol_with_ray(self): - self._test_ol(True) - - def test_ol_without_ray(self): - self._test_ol(False) - - def test_ol_no_score_final(self): - class ModelNuisance: - def __init__(self, model_t, model_y): - self._model_t = model_t - self._model_y = model_y - - def train(self, is_selecting, Y, T, W=None): - self._model_t.fit(W, T) - self._model_y.fit(W, Y) - return self - - def predict(self, Y, T, W=None): - return Y - self._model_y.predict(W), T - self._model_t.predict(W) - - class ModelFinal: - - def __init__(self): - return - - def fit(self, Y, T, W=None, nuisances=None): - Y_res, T_res = nuisances - self.model = LinearRegression(fit_intercept=False).fit(T_res.reshape(-1, 1), Y_res) - return self - - def predict(self, X=None): - return self.model.coef_[0] - - class OrthoLearner(_OrthoLearner): - def _gen_ortho_learner_model_nuisance(self): - return ModelNuisance(LinearRegression(), LinearRegression()) - - def _gen_ortho_learner_model_final(self): - return ModelFinal() - - np.random.seed(123) - X = np.random.normal(size=(10000, 3)) - sigma = 0.1 - y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) - est = OrthoLearner(cv=2, discrete_outcome=False, discrete_treatment=False, - treatment_featurizer=None, discrete_instrument=False, - categories='auto', random_state=None) - est.fit(y, X[:, 0], W=X[:, 1:]) - np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=3) - np.testing.assert_array_almost_equal(est.effect(), np.ones(1), decimal=3) - 
np.testing.assert_array_almost_equal(est.effect(T0=0, T1=10), np.ones(1) * 10, decimal=2) - assert est.score_ is None - np.testing.assert_almost_equal(est.ortho_learner_model_final_.model.coef_[0], 1, decimal=3) - - def test_ol_nuisance_scores(self): - class ModelNuisance: - def __init__(self, model_t, model_y): - self._model_t = model_t - self._model_y = model_y - - def train(self, is_selecting, Y, T, W=None): - self._model_t.fit(W, T) - self._model_y.fit(W, Y) - return self - - def predict(self, Y, T, W=None): - return Y - self._model_y.predict(W), T - self._model_t.predict(W) - - def score(self, Y, T, W=None): - return (self._model_t.score(W, Y), self._model_y.score(W, T)) - - class ModelFinal: - - def __init__(self): - return - - def fit(self, Y, T, W=None, nuisances=None): - Y_res, T_res = nuisances - self.model = LinearRegression(fit_intercept=False).fit(T_res.reshape(-1, 1), Y_res) - return self - - def predict(self, X=None): - return self.model.coef_[0] - - class OrthoLearner(_OrthoLearner): - def _gen_ortho_learner_model_nuisance(self): - return ModelNuisance(LinearRegression(), LinearRegression()) - - def _gen_ortho_learner_model_final(self): - return ModelFinal() - - np.random.seed(123) - X = np.random.normal(size=(10000, 3)) - sigma = 0.1 - y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) - est = OrthoLearner(cv=2, discrete_outcome=False, discrete_treatment=False, - treatment_featurizer=None, discrete_instrument=False, - categories='auto', random_state=None) - est.fit(y, X[:, 0], W=X[:, 1:]) - np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=3) - np.testing.assert_array_almost_equal(est.effect(), np.ones(1), decimal=3) - np.testing.assert_array_almost_equal(est.effect(T0=0, T1=10), np.ones(1) * 10, decimal=2) - np.testing.assert_almost_equal(est.ortho_learner_model_final_.model.coef_[0], 1, decimal=3) - nuisance_scores_y = est.nuisance_scores_[0] - nuisance_scores_t = est.nuisance_scores_[1] - assert 
len(nuisance_scores_y) == len(nuisance_scores_t) == 1 # as many scores as iterations - assert len(nuisance_scores_y[0]) == len(nuisance_scores_t[0]) == 2 # as many scores as splits - # y scores should be positive, since W predicts Y somewhat - # t scores might not be, since W and T are uncorrelated - np.testing.assert_array_less(0, nuisance_scores_y[0]) - - def test_ol_discrete_treatment(self): - class ModelNuisance: - def __init__(self, model_t, model_y): - self._model_t = model_t - self._model_y = model_y - - def train(self, is_selecting, Y, T, W=None): - self._model_t.fit(W, np.matmul(T, np.arange(1, T.shape[1] + 1))) - self._model_y.fit(W, Y) - return self - - def predict(self, Y, T, W=None): - return Y - self._model_y.predict(W), T - self._model_t.predict_proba(W)[:, 1:] - - class ModelFinal: - - def __init__(self): - return - - def fit(self, Y, T, W=None, nuisances=None): - Y_res, T_res = nuisances - self.model = LinearRegression(fit_intercept=False).fit(T_res.reshape(-1, 1), Y_res) - return self - - def predict(self): - # theta needs to be of dimension (1, d_t) if T is (n, d_t) - return np.array([[self.model.coef_[0]]]) - - def score(self, Y, T, W=None, nuisances=None): - Y_res, T_res = nuisances - return np.mean((Y_res - self.model.predict(T_res.reshape(-1, 1)))**2) - - from sklearn.linear_model import LogisticRegression - - class OrthoLearner(_OrthoLearner): - def _gen_ortho_learner_model_nuisance(self): - return ModelNuisance(LogisticRegression(solver='lbfgs'), LinearRegression()) - - def _gen_ortho_learner_model_final(self): - return ModelFinal() - - np.random.seed(123) - X = np.random.normal(size=(10000, 3)) - import scipy.special - T = np.random.binomial(1, scipy.special.expit(X[:, 0])) - sigma = 0.01 - y = T + X[:, 0] + np.random.normal(0, sigma, size=(10000,)) - est = OrthoLearner(cv=2, discrete_outcome=False, discrete_treatment=True, - treatment_featurizer=None, discrete_instrument=False, - categories='auto', random_state=None) - est.fit(y, T, W=X) 
- np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=3) - np.testing.assert_array_almost_equal(est.effect(), np.ones(1), decimal=3) - np.testing.assert_almost_equal(est.score(y, T, W=X), sigma**2, decimal=3) - np.testing.assert_almost_equal(est.ortho_learner_model_final_.model.coef_[0], 1, decimal=3) +# Copyright (c) PyWhy contributors. All rights reserved. +# Licensed under the MIT License. + +from sklearn.datasets import make_regression +from econml._ortho_learner import _OrthoLearner, _crossfit +from sklearn.linear_model import LinearRegression +from sklearn.preprocessing import PolynomialFeatures +from sklearn.linear_model import LinearRegression, LassoCV, Lasso +from sklearn.model_selection import KFold +import numpy as np +import unittest +import joblib +import pytest + +try: + import ray + + ray_installed = True +except ImportError: + ray_installed = False + + +class TestOrthoLearner(unittest.TestCase): + + def _test_crossfit(self, use_ray): + class Wrapper: + + def __init__(self, model): + self._model = model + + def train(self, is_selecting, X, y, Q, W=None): + self._model.fit(X, y) + return self + + def predict(self, X, y, Q, W=None): + return self._model.predict(X), y - self._model.predict(X), X + + def score(self, X, y, Q, W=None): + return self._model.score(X, y) + + np.random.seed(123) + X = np.random.normal(size=(5000, 3)) + y = X[:, 0] + np.random.normal(size=(5000,)) + folds = list(KFold(2).split(X, y)) + model = Lasso(alpha=0.01) + ray_remote_function_option = {"num_cpus": 1} + + nuisance, model_list, fitted_inds, scores = _crossfit(Wrapper(model), folds, use_ray, + ray_remote_function_option, + X, y, y, Z=None) + np.testing.assert_allclose(nuisance[0][folds[0][1]], + model.fit(X[folds[0][0]], y[folds[0][0]]).predict(X[folds[0][1]])) + np.testing.assert_allclose(nuisance[0][folds[0][0]], + model.fit(X[folds[0][1]], y[folds[0][1]]).predict(X[folds[0][0]])) + np.testing.assert_allclose(scores[0][0], model.fit(X[folds[0][0]], 
y[folds[0][0]]).score(X[folds[0][1]], + y[folds[0][1]])) + np.testing.assert_allclose(scores[0][1], model.fit(X[folds[0][1]], y[folds[0][1]]).score(X[folds[0][0]], + y[folds[0][0]])) + coef_ = np.zeros(X.shape[1]) + coef_[0] = 1 + [np.testing.assert_allclose(coef_, mdl._model.coef_, rtol=0, atol=0.08) for mdl in model_list] + np.testing.assert_array_equal(fitted_inds, np.arange(X.shape[0])) + + np.random.seed(123) + X = np.random.normal(size=(5000, 3)) + y = X[:, 0] + np.random.normal(size=(5000,)) + folds = list(KFold(2).split(X, y)) + model = Lasso(alpha=0.01) + nuisance, model_list, fitted_inds, scores = _crossfit(Wrapper(model), folds, use_ray, + ray_remote_function_option, + X, y, y, Z=None) + np.testing.assert_allclose(nuisance[0][folds[0][1]], + model.fit(X[folds[0][0]], y[folds[0][0]]).predict(X[folds[0][1]])) + np.testing.assert_allclose(nuisance[0][folds[0][0]], + model.fit(X[folds[0][1]], y[folds[0][1]]).predict(X[folds[0][0]])) + np.testing.assert_allclose(scores[0][0], model.fit(X[folds[0][0]], y[folds[0][0]]).score(X[folds[0][1]], + y[folds[0][1]])) + np.testing.assert_allclose(scores[0][1], model.fit(X[folds[0][1]], y[folds[0][1]]).score(X[folds[0][0]], + y[folds[0][0]])) + coef_ = np.zeros(X.shape[1]) + coef_[0] = 1 + [np.testing.assert_allclose(coef_, mdl._model.coef_, rtol=0, atol=0.08) for mdl in model_list] + np.testing.assert_array_equal(fitted_inds, np.arange(X.shape[0])) + + np.random.seed(123) + X = np.random.normal(size=(5000, 3)) + y = X[:, 0] + np.random.normal(size=(5000,)) + folds = list(KFold(2).split(X, y)) + model = Lasso(alpha=0.01) + nuisance, model_list, fitted_inds, scores = _crossfit(Wrapper(model), folds, use_ray, + ray_remote_function_option, + X, y, y, Z=None) + np.testing.assert_allclose(nuisance[0][folds[0][1]], + model.fit(X[folds[0][0]], y[folds[0][0]]).predict(X[folds[0][1]])) + np.testing.assert_allclose(nuisance[0][folds[0][0]], + model.fit(X[folds[0][1]], y[folds[0][1]]).predict(X[folds[0][0]])) + 
np.testing.assert_allclose(scores[0][0], model.fit(X[folds[0][0]], y[folds[0][0]]).score(X[folds[0][1]], + y[folds[0][1]])) + np.testing.assert_allclose(scores[0][1], model.fit(X[folds[0][1]], y[folds[0][1]]).score(X[folds[0][0]], + y[folds[0][0]])) + coef_ = np.zeros(X.shape[1]) + coef_[0] = 1 + [np.testing.assert_allclose(coef_, mdl._model.coef_, rtol=0, atol=0.08) for mdl in model_list] + np.testing.assert_array_equal(fitted_inds, np.arange(X.shape[0])) + + class Wrapper: + + def __init__(self, model): + self._model = model + + def train(self, is_selecting, X, y, W=None): + self._model.fit(X, y) + return self + + def predict(self, X, y, W=None): + return self._model.predict(X), y - self._model.predict(X), X + + np.random.seed(123) + X = np.random.normal(size=(5000, 3)) + y = X[:, 0] + np.random.normal(size=(5000,)) + folds = [(np.arange(X.shape[0] // 2), np.arange(X.shape[0] // 2, X.shape[0])), + (np.arange(X.shape[0] // 2), np.arange(X.shape[0] // 2, X.shape[0]))] + model = Lasso(alpha=0.01) + with pytest.raises(AttributeError) as e_info: + nuisance, model_list, fitted_inds, scores = _crossfit(Wrapper(model), folds, use_ray, + ray_remote_function_option, + X, y, y, Z=None) + + np.random.seed(123) + X = np.random.normal(size=(5000, 3)) + y = X[:, 0] + np.random.normal(size=(5000,)) + folds = [(np.arange(X.shape[0] // 2), np.arange(X.shape[0] // 2, X.shape[0])), + (np.arange(X.shape[0] // 2), np.arange(X.shape[0] // 2, X.shape[0]))] + model = Lasso(alpha=0.01) + with pytest.raises(AttributeError) as e_info: + nuisance, model_list, fitted_inds, scores = _crossfit(Wrapper(model), folds, use_ray, + ray_remote_function_option, + X, y, y, Z=None) + + np.random.seed(123) + X = np.random.normal(size=(5000, 3)) + y = X[:, 0] + np.random.normal(size=(5000,)) + folds = [(np.arange(X.shape[0]), np.arange(X.shape[0]))] + model = Lasso(alpha=0.01) + with pytest.raises(AttributeError) as e_info: + nuisance, model_list, fitted_inds, scores = _crossfit(Wrapper(model), folds, 
use_ray, + ray_remote_function_option, + X, y, y, Z=None) + + np.random.seed(123) + X = np.random.normal(size=(5000, 3)) + y = X[:, 0] + np.random.normal(size=(5000,)) + folds = [(np.arange(X.shape[0]), np.arange(X.shape[0]))] + model = Lasso(alpha=0.01) + with pytest.raises(AttributeError) as e_info: + nuisance, model_list, fitted_inds, scores = _crossfit(Wrapper(model), folds, use_ray, + ray_remote_function_option, + X, y, y, Z=None) + + @pytest.mark.ray + def test_crossfit_with_ray(self): + try: + ray.init() + self._test_crossfit(use_ray=True) + finally: + ray.shutdown() + + def test_crossfit_without_ray(self): + self._test_crossfit(use_ray=False) + + @pytest.mark.ray + def test_crossfit_comparison(self): + try: + ray.init() # Initialize Ray + + class Wrapper: + + def __init__(self, model): + self._model = model + + def train(self, is_selecting, X, y, Q, W=None): + self._model.fit(X, y) + return self + + def predict(self, X, y, Q, W=None): + return self._model.predict(X), y - self._model.predict(X), X + + def score(self, X, y, Q, W=None): + return self._model.score(X, y) + + # Generate synthetic data + X, y = make_regression(n_samples=10, n_features=5, noise=0.1, random_state=42) + folds = list(KFold(2).split(X, y)) + model = LinearRegression() + ray_remote_function_option = {"num_cpus": 1} + + # Run _crossfit with Ray enabled + nuisance_ray, model_list_ray, fitted_inds_ray, scores_ray = _crossfit(Wrapper(model), folds, True, + ray_remote_function_option, + X, y, y, Z=None) + # Run _crossfit without Ray + nuisance_regular, model_list_regular, fitted_inds_regular, scores_regular = _crossfit(Wrapper(model), + folds, + False, {}, + X, y, y, Z=None) + # Compare the results + assert np.allclose(nuisance_ray[0], nuisance_regular[0]) + assert np.allclose(nuisance_ray[1], nuisance_regular[1]) + assert np.allclose(fitted_inds_ray, fitted_inds_regular) + assert np.allclose(scores_ray, scores_regular) + + finally: + ray.shutdown() # Shutdown Ray + + def _test_ol(self, 
use_ray): + class ModelNuisance: + def __init__(self, model_t, model_y): + self._model_t = model_t + self._model_y = model_y + + def train(self, is_selecting, Y, T, W=None): + self._model_t.fit(W, T) + self._model_y.fit(W, Y) + return self + + def predict(self, Y, T, W=None): + return Y - self._model_y.predict(W), T - self._model_t.predict(W) + + class ModelFinal: + + def __init__(self): + return + + def fit(self, Y, T, W=None, nuisances=None): + Y_res, T_res = nuisances + self.model = LinearRegression(fit_intercept=False).fit(T_res.reshape(-1, 1), Y_res) + return self + + def predict(self, X=None): + return self.model.coef_[0] + + def score(self, Y, T, W=None, nuisances=None): + Y_res, T_res = nuisances + return np.mean((Y_res - self.model.predict(T_res.reshape(-1, 1))) ** 2) + + class OrthoLearner(_OrthoLearner): + def _gen_ortho_learner_model_nuisance(self): + return ModelNuisance(LinearRegression(), LinearRegression()) + + def _gen_ortho_learner_model_final(self): + return ModelFinal() + + np.random.seed(123) + X = np.random.normal(size=(10000, 3)) + sigma = 0.1 + y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) + + est = OrthoLearner(cv=2, discrete_outcome=False, discrete_treatment=False, treatment_featurizer=None, + discrete_instrument=False, categories='auto', random_state=None, use_ray=use_ray) + est.fit(y, X[:, 0], W=X[:, 1:]) + np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=3) + np.testing.assert_array_almost_equal(est.effect(), np.ones(1), decimal=3) + np.testing.assert_array_almost_equal(est.effect(T0=0, T1=10), np.ones(1) * 10, decimal=2) + np.testing.assert_almost_equal(est.score(y, X[:, 0], W=X[:, 1:]), sigma**2, decimal=3) + np.testing.assert_almost_equal(est.score_, sigma**2, decimal=3) + np.testing.assert_almost_equal(est.ortho_learner_model_final_.model.coef_[0], 1, decimal=3) + # Nuisance model has no score method, so nuisance_scores_ should be none + assert est.nuisance_scores_ is None + + # Test non 
keyword based calls to fit + np.random.seed(123) + X = np.random.normal(size=(10000, 3)) + sigma = 0.1 + y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) + est = OrthoLearner(cv=2, discrete_outcome=False, discrete_treatment=False, treatment_featurizer=None, + discrete_instrument=False, categories='auto', random_state=None, use_ray=use_ray) + # test non-array inputs + est.fit(list(y), list(X[:, 0]), X=None, W=X[:, 1:]) + np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=3) + np.testing.assert_array_almost_equal(est.effect(), np.ones(1), decimal=3) + np.testing.assert_array_almost_equal(est.effect(T0=0, T1=10), np.ones(1) * 10, decimal=2) + np.testing.assert_almost_equal(est.score(y, X[:, 0], None, X[:, 1:]), sigma ** 2, decimal=3) + np.testing.assert_almost_equal(est.score_, sigma ** 2, decimal=3) + np.testing.assert_almost_equal(est.ortho_learner_model_final_.model.coef_[0], 1, decimal=3) + + # Test custom splitter + np.random.seed(123) + X = np.random.normal(size=(10000, 3)) + sigma = 0.1 + y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) + est = OrthoLearner(cv=KFold(n_splits=3), discrete_outcome=False, + discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, + categories='auto', random_state=None, use_ray=use_ray) + est.fit(y, X[:, 0], X=None, W=X[:, 1:]) + np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=3) + np.testing.assert_array_almost_equal(est.effect(), np.ones(1), decimal=3) + np.testing.assert_array_almost_equal(est.effect(T0=0, T1=10), np.ones(1) * 10, decimal=2) + np.testing.assert_almost_equal(est.score(y, X[:, 0], W=X[:, 1:]), sigma**2, decimal=3) + np.testing.assert_almost_equal(est.score_, sigma**2, decimal=3) + np.testing.assert_almost_equal(est.ortho_learner_model_final_.model.coef_[0], 1, decimal=3) + + # Test incomplete set of test folds + np.random.seed(123) + X = np.random.normal(size=(10000, 3)) + sigma = 0.1 + y = X[:, 0] + X[:, 1] + 
np.random.normal(0, sigma, size=(10000,)) + folds = [(np.arange(X.shape[0] // 2), np.arange(X.shape[0] // 2, X.shape[0]))] + est = OrthoLearner(cv=KFold(n_splits=3), discrete_outcome=False, + discrete_treatment=False, treatment_featurizer=None, discrete_instrument=False, + categories='auto', random_state=None, use_ray=use_ray) + + est.fit(y, X[:, 0], X=None, W=X[:, 1:]) + np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=2) + np.testing.assert_array_almost_equal(est.effect(), np.ones(1), decimal=2) + np.testing.assert_array_almost_equal(est.effect(T0=0, T1=10), np.ones(1) * 10, decimal=1) + np.testing.assert_almost_equal(est.score(y, X[:, 0], W=X[:, 1:]), sigma**2, decimal=2) + np.testing.assert_almost_equal(est.score_, sigma**2, decimal=2) + np.testing.assert_almost_equal(est.ortho_learner_model_final_.model.coef_[0], 1, decimal=2) + + @pytest.mark.ray + def test_ol_with_ray(self): + self._test_ol(True) + + def test_ol_without_ray(self): + self._test_ol(False) + + def test_ol_no_score_final(self): + class ModelNuisance: + def __init__(self, model_t, model_y): + self._model_t = model_t + self._model_y = model_y + + def train(self, is_selecting, Y, T, W=None): + self._model_t.fit(W, T) + self._model_y.fit(W, Y) + return self + + def predict(self, Y, T, W=None): + return Y - self._model_y.predict(W), T - self._model_t.predict(W) + + class ModelFinal: + + def __init__(self): + return + + def fit(self, Y, T, W=None, nuisances=None): + Y_res, T_res = nuisances + self.model = LinearRegression(fit_intercept=False).fit(T_res.reshape(-1, 1), Y_res) + return self + + def predict(self, X=None): + return self.model.coef_[0] + + class OrthoLearner(_OrthoLearner): + def _gen_ortho_learner_model_nuisance(self): + return ModelNuisance(LinearRegression(), LinearRegression()) + + def _gen_ortho_learner_model_final(self): + return ModelFinal() + + np.random.seed(123) + X = np.random.normal(size=(10000, 3)) + sigma = 0.1 + y = X[:, 0] + X[:, 1] + 
np.random.normal(0, sigma, size=(10000,)) + est = OrthoLearner(cv=2, discrete_outcome=False, discrete_treatment=False, + treatment_featurizer=None, discrete_instrument=False, + categories='auto', random_state=None) + est.fit(y, X[:, 0], W=X[:, 1:]) + np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=3) + np.testing.assert_array_almost_equal(est.effect(), np.ones(1), decimal=3) + np.testing.assert_array_almost_equal(est.effect(T0=0, T1=10), np.ones(1) * 10, decimal=2) + assert est.score_ is None + np.testing.assert_almost_equal(est.ortho_learner_model_final_.model.coef_[0], 1, decimal=3) + + def test_ol_nuisance_scores(self): + class ModelNuisance: + def __init__(self, model_t, model_y): + self._model_t = model_t + self._model_y = model_y + + def train(self, is_selecting, Y, T, W=None): + self._model_t.fit(W, T) + self._model_y.fit(W, Y) + return self + + def predict(self, Y, T, W=None): + return Y - self._model_y.predict(W), T - self._model_t.predict(W) + + def score(self, Y, T, W=None): + return (self._model_t.score(W, Y), self._model_y.score(W, T)) + + class ModelFinal: + + def __init__(self): + return + + def fit(self, Y, T, W=None, nuisances=None): + Y_res, T_res = nuisances + self.model = LinearRegression(fit_intercept=False).fit(T_res.reshape(-1, 1), Y_res) + return self + + def predict(self, X=None): + return self.model.coef_[0] + + class OrthoLearner(_OrthoLearner): + def _gen_ortho_learner_model_nuisance(self): + return ModelNuisance(LinearRegression(), LinearRegression()) + + def _gen_ortho_learner_model_final(self): + return ModelFinal() + + np.random.seed(123) + X = np.random.normal(size=(10000, 3)) + sigma = 0.1 + y = X[:, 0] + X[:, 1] + np.random.normal(0, sigma, size=(10000,)) + est = OrthoLearner(cv=2, discrete_outcome=False, discrete_treatment=False, + treatment_featurizer=None, discrete_instrument=False, + categories='auto', random_state=None) + est.fit(y, X[:, 0], W=X[:, 1:]) + 
np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=3) + np.testing.assert_array_almost_equal(est.effect(), np.ones(1), decimal=3) + np.testing.assert_array_almost_equal(est.effect(T0=0, T1=10), np.ones(1) * 10, decimal=2) + np.testing.assert_almost_equal(est.ortho_learner_model_final_.model.coef_[0], 1, decimal=3) + nuisance_scores_y = est.nuisance_scores_[0] + nuisance_scores_t = est.nuisance_scores_[1] + assert len(nuisance_scores_y) == len(nuisance_scores_t) == 1 # as many scores as iterations + assert len(nuisance_scores_y[0]) == len(nuisance_scores_t[0]) == 2 # as many scores as splits + # y scores should be positive, since W predicts Y somewhat + # t scores might not be, since W and T are uncorrelated + np.testing.assert_array_less(0, nuisance_scores_y[0]) + + def test_ol_discrete_treatment(self): + class ModelNuisance: + def __init__(self, model_t, model_y): + self._model_t = model_t + self._model_y = model_y + + def train(self, is_selecting, Y, T, W=None): + self._model_t.fit(W, np.matmul(T, np.arange(1, T.shape[1] + 1))) + self._model_y.fit(W, Y) + return self + + def predict(self, Y, T, W=None): + return Y - self._model_y.predict(W), T - self._model_t.predict_proba(W)[:, 1:] + + class ModelFinal: + + def __init__(self): + return + + def fit(self, Y, T, W=None, nuisances=None): + Y_res, T_res = nuisances + self.model = LinearRegression(fit_intercept=False).fit(T_res.reshape(-1, 1), Y_res) + return self + + def predict(self): + # theta needs to be of dimension (1, d_t) if T is (n, d_t) + return np.array([[self.model.coef_[0]]]) + + def score(self, Y, T, W=None, nuisances=None): + Y_res, T_res = nuisances + return np.mean((Y_res - self.model.predict(T_res.reshape(-1, 1)))**2) + + from sklearn.linear_model import LogisticRegression + + class OrthoLearner(_OrthoLearner): + def _gen_ortho_learner_model_nuisance(self): + return ModelNuisance(LogisticRegression(solver='lbfgs'), LinearRegression()) + + def _gen_ortho_learner_model_final(self): 
+ return ModelFinal() + + np.random.seed(123) + X = np.random.normal(size=(10000, 3)) + import scipy.special + T = np.random.binomial(1, scipy.special.expit(X[:, 0])) + sigma = 0.01 + y = T + X[:, 0] + np.random.normal(0, sigma, size=(10000,)) + est = OrthoLearner(cv=2, discrete_outcome=False, discrete_treatment=True, + treatment_featurizer=None, discrete_instrument=False, + categories='auto', random_state=None) + est.fit(y, T, W=X) + np.testing.assert_almost_equal(est.const_marginal_effect(), 1, decimal=3) + np.testing.assert_array_almost_equal(est.effect(), np.ones(1), decimal=3) + np.testing.assert_almost_equal(est.score(y, T, W=X), sigma**2, decimal=3) + np.testing.assert_almost_equal(est.ortho_learner_model_final_.model.coef_[0], 1, decimal=3) From b848e734d67b292426aca2dcc7b5ba204543b4b8 Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Tue, 9 Jan 2024 14:58:58 -0500 Subject: [PATCH 22/25] fix tests where clf was used without specifying disc treat Signed-off-by: Fabio Vera --- econml/tests/test_drtester.py | 12 ++- econml/tests/test_federated_learning.py | 11 ++- econml/tests/test_missing_values.py | 3 +- econml/tests/test_refit.py | 4 +- notebooks/CATE validation.ipynb | 116 ++++++++---------------- 5 files changed, 60 insertions(+), 86 deletions(-) diff --git a/econml/tests/test_drtester.py b/econml/tests/test_drtester.py index 9e890c190..cc66cfe6a 100644 --- a/econml/tests/test_drtester.py +++ b/econml/tests/test_drtester.py @@ -65,7 +65,8 @@ def test_multi(self): cate = DML( model_y=reg_y, model_t=reg_t, - model_final=reg_y + model_final=reg_y, + discrete_treatment=True ).fit(Y=Ytrain, T=Dtrain, X=Xtrain) # test the DR outcome difference @@ -114,7 +115,8 @@ def test_binary(self): cate = DML( model_y=reg_y, model_t=reg_t, - model_final=reg_y + model_final=reg_y, + discrete_treatment=True ).fit(Y=Ytrain, T=Dtrain, X=Xtrain) # test the DR outcome difference @@ -158,7 +160,8 @@ def test_nuisance_val_fit(self): cate = DML( model_y=reg_y, model_t=reg_t, - 
model_final=reg_y + model_final=reg_y, + discrete_treatment=True ).fit(Y=Ytrain, T=Dtrain, X=Xtrain) # test the DR outcome difference @@ -198,7 +201,8 @@ def test_exceptions(self): cate = DML( model_y=reg_y, model_t=reg_t, - model_final=reg_y + model_final=reg_y, + discrete_treatment=True ).fit(Y=Ytrain, T=Dtrain, X=Xtrain) # test the DR outcome difference diff --git a/econml/tests/test_federated_learning.py b/econml/tests/test_federated_learning.py index 71c674e69..27f656945 100644 --- a/econml/tests/test_federated_learning.py +++ b/econml/tests/test_federated_learning.py @@ -23,6 +23,13 @@ def fit(self, X, y, sample_weight=None): def predict(self, X): return self.func(X) + +class FunctionClassifier(FunctionRegressor): + """A simple model that ignores the data it is fitted on, always just using the specified function to predict""" + + def __init__(self, func): + self.func = func + def predict_proba(self, X): return self.func(X) @@ -62,8 +69,8 @@ def test_lineardrlearner(self): a = np.random.normal(size=(n_x + n_w, n_t)) b = np.random.normal(size=(n_x + n_w + n_t - 1)) - t_model = FunctionRegressor(lambda XW: np.exp(XW @ a)) - y_model = FunctionRegressor(lambda XW: XW @ b) + t_model = FunctionClassifier(lambda XW: np.exp(XW @ a)) + y_model = FunctionClassifier(lambda XW: XW @ b) for cov_type in ['HC0', 'HC1', 'nonrobust']: with self.subTest(n_t=n_t, cov_type=cov_type): diff --git a/econml/tests/test_missing_values.py b/econml/tests/test_missing_values.py index 761da5dbc..e59c8811c 100644 --- a/econml/tests/test_missing_values.py +++ b/econml/tests/test_missing_values.py @@ -166,7 +166,8 @@ def test_missing2(self): x_w_missing_models = [ NonParamDML(model_y=regr, model_t=clsf, model_final=non_param_model_final, discrete_treatment=discrete_treatment, allow_missing=True), - DML(model_y=regr, model_t=clsf, model_final=param_model_final, allow_missing=True), + DML(model_y=regr, model_t=clsf, discrete_treatment=discrete_treatment, + model_final=param_model_final, 
allow_missing=True), DMLIV(model_y_xw=regr, model_t_xw=clsf, model_t_xwz=clsf, model_final=param_model_final, discrete_treatment=discrete_treatment, discrete_instrument=discrete_instrument, allow_missing=True), diff --git a/econml/tests/test_refit.py b/econml/tests/test_refit.py index 00cc81dff..5f473200e 100644 --- a/econml/tests/test_refit.py +++ b/econml/tests/test_refit.py @@ -265,8 +265,8 @@ def test_can_set_discrete_treatment(self): est.fit(y, T, X=X, W=W) est.effect(X) est.discrete_treatment = False - est.fit(y, T, X=X, W=W) - est.effect(X) + with pytest.raises(AttributeError): + est.fit(y, T, X=X, W=W) # should fail because passing a clf when discrete_treatment=False def test_refit_final_inference(self): """Test that we can perform inference during refit_final""" diff --git a/notebooks/CATE validation.ipynb b/notebooks/CATE validation.ipynb index 57b20444b..07c9ba86f 100644 --- a/notebooks/CATE validation.ipynb +++ b/notebooks/CATE validation.ipynb @@ -13,44 +13,7 @@ }, "scrolled": true }, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "/opt/anaconda3/envs/cate_test/lib/python3.9/site-packages/shap/utils/_clustering.py:35: NumbaDeprecationWarning: The 'nopython' keyword argument was not supplied to the 'numba.jit' decorator. The implicit default value for this argument is currently False, but it will be changed to True in Numba 0.59.0. See https://numba.readthedocs.io/en/stable/reference/deprecation.html#deprecation-of-object-mode-fall-back-behaviour-when-using-jit for details.\n", - " def _pt_shuffle_rec(i, indexes, index_mask, partition_tree, M, pos):\n", - "/opt/anaconda3/envs/cate_test/lib/python3.9/site-packages/shap/utils/_clustering.py:54: NumbaDeprecationWarning: The 'nopython' keyword argument was not supplied to the 'numba.jit' decorator. The implicit default value for this argument is currently False, but it will be changed to True in Numba 0.59.0. 
See https://numba.readthedocs.io/en/stable/reference/deprecation.html#deprecation-of-object-mode-fall-back-behaviour-when-using-jit for details.\n", - " def delta_minimization_order(all_masks, max_swap_size=100, num_passes=2):\n", - "/opt/anaconda3/envs/cate_test/lib/python3.9/site-packages/shap/utils/_clustering.py:63: NumbaDeprecationWarning: The 'nopython' keyword argument was not supplied to the 'numba.jit' decorator. The implicit default value for this argument is currently False, but it will be changed to True in Numba 0.59.0. See https://numba.readthedocs.io/en/stable/reference/deprecation.html#deprecation-of-object-mode-fall-back-behaviour-when-using-jit for details.\n", - " def _reverse_window(order, start, length):\n", - "/opt/anaconda3/envs/cate_test/lib/python3.9/site-packages/shap/utils/_clustering.py:69: NumbaDeprecationWarning: The 'nopython' keyword argument was not supplied to the 'numba.jit' decorator. The implicit default value for this argument is currently False, but it will be changed to True in Numba 0.59.0. See https://numba.readthedocs.io/en/stable/reference/deprecation.html#deprecation-of-object-mode-fall-back-behaviour-when-using-jit for details.\n", - " def _reverse_window_score_gain(masks, order, start, length):\n", - "/opt/anaconda3/envs/cate_test/lib/python3.9/site-packages/shap/utils/_clustering.py:77: NumbaDeprecationWarning: The 'nopython' keyword argument was not supplied to the 'numba.jit' decorator. The implicit default value for this argument is currently False, but it will be changed to True in Numba 0.59.0. See https://numba.readthedocs.io/en/stable/reference/deprecation.html#deprecation-of-object-mode-fall-back-behaviour-when-using-jit for details.\n", - " def _mask_delta_score(m1, m2):\n", - "/opt/anaconda3/envs/cate_test/lib/python3.9/site-packages/shap/links.py:5: NumbaDeprecationWarning: The 'nopython' keyword argument was not supplied to the 'numba.jit' decorator. 
The implicit default value for this argument is currently False, but it will be changed to True in Numba 0.59.0. See https://numba.readthedocs.io/en/stable/reference/deprecation.html#deprecation-of-object-mode-fall-back-behaviour-when-using-jit for details.\n", - " def identity(x):\n", - "/opt/anaconda3/envs/cate_test/lib/python3.9/site-packages/shap/links.py:10: NumbaDeprecationWarning: The 'nopython' keyword argument was not supplied to the 'numba.jit' decorator. The implicit default value for this argument is currently False, but it will be changed to True in Numba 0.59.0. See https://numba.readthedocs.io/en/stable/reference/deprecation.html#deprecation-of-object-mode-fall-back-behaviour-when-using-jit for details.\n", - " def _identity_inverse(x):\n", - "/opt/anaconda3/envs/cate_test/lib/python3.9/site-packages/shap/links.py:15: NumbaDeprecationWarning: The 'nopython' keyword argument was not supplied to the 'numba.jit' decorator. The implicit default value for this argument is currently False, but it will be changed to True in Numba 0.59.0. See https://numba.readthedocs.io/en/stable/reference/deprecation.html#deprecation-of-object-mode-fall-back-behaviour-when-using-jit for details.\n", - " def logit(x):\n", - "/opt/anaconda3/envs/cate_test/lib/python3.9/site-packages/shap/links.py:20: NumbaDeprecationWarning: The 'nopython' keyword argument was not supplied to the 'numba.jit' decorator. The implicit default value for this argument is currently False, but it will be changed to True in Numba 0.59.0. See https://numba.readthedocs.io/en/stable/reference/deprecation.html#deprecation-of-object-mode-fall-back-behaviour-when-using-jit for details.\n", - " def _logit_inverse(x):\n", - "/opt/anaconda3/envs/cate_test/lib/python3.9/site-packages/shap/utils/_masked_model.py:362: NumbaDeprecationWarning: The 'nopython' keyword argument was not supplied to the 'numba.jit' decorator. 
The implicit default value for this argument is currently False, but it will be changed to True in Numba 0.59.0. See https://numba.readthedocs.io/en/stable/reference/deprecation.html#deprecation-of-object-mode-fall-back-behaviour-when-using-jit for details.\n", - " def _build_fixed_single_output(averaged_outs, last_outs, outputs, batch_positions, varying_rows, num_varying_rows, link, linearizing_weights):\n", - "/opt/anaconda3/envs/cate_test/lib/python3.9/site-packages/shap/utils/_masked_model.py:384: NumbaDeprecationWarning: The 'nopython' keyword argument was not supplied to the 'numba.jit' decorator. The implicit default value for this argument is currently False, but it will be changed to True in Numba 0.59.0. See https://numba.readthedocs.io/en/stable/reference/deprecation.html#deprecation-of-object-mode-fall-back-behaviour-when-using-jit for details.\n", - " def _build_fixed_multi_output(averaged_outs, last_outs, outputs, batch_positions, varying_rows, num_varying_rows, link, linearizing_weights):\n", - "/opt/anaconda3/envs/cate_test/lib/python3.9/site-packages/shap/maskers/_tabular.py:185: NumbaDeprecationWarning: The 'nopython' keyword argument was not supplied to the 'numba.jit' decorator. The implicit default value for this argument is currently False, but it will be changed to True in Numba 0.59.0. See https://numba.readthedocs.io/en/stable/reference/deprecation.html#deprecation-of-object-mode-fall-back-behaviour-when-using-jit for details.\n", - " def _single_delta_mask(dind, masked_inputs, last_mask, data, x, noop_code):\n", - "/opt/anaconda3/envs/cate_test/lib/python3.9/site-packages/shap/maskers/_tabular.py:196: NumbaDeprecationWarning: The 'nopython' keyword argument was not supplied to the 'numba.jit' decorator. The implicit default value for this argument is currently False, but it will be changed to True in Numba 0.59.0. 
See https://numba.readthedocs.io/en/stable/reference/deprecation.html#deprecation-of-object-mode-fall-back-behaviour-when-using-jit for details.\n", - " def _delta_masking(masks, x, curr_delta_inds, varying_rows_out,\n", - "/opt/anaconda3/envs/cate_test/lib/python3.9/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n", - " from .autonotebook import tqdm as notebook_tqdm\n", - "The 'nopython' keyword argument was not supplied to the 'numba.jit' decorator. The implicit default value for this argument is currently False, but it will be changed to True in Numba 0.59.0. See https://numba.readthedocs.io/en/stable/reference/deprecation.html#deprecation-of-object-mode-fall-back-behaviour-when-using-jit for details.\n", - "The 'nopython' keyword argument was not supplied to the 'numba.jit' decorator. The implicit default value for this argument is currently False, but it will be changed to True in Numba 0.59.0. See https://numba.readthedocs.io/en/stable/reference/deprecation.html#deprecation-of-object-mode-fall-back-behaviour-when-using-jit for details.\n" - ] - } - ], + "outputs": [], "source": [ "import numpy as np\n", "import pandas as pd\n", @@ -166,14 +129,13 @@ "name": "stderr", "output_type": "stream", "text": [ - "`sparse` was renamed to `sparse_output` in version 1.2 and will be removed in 1.4. 
`sparse_output` is ignored unless you leave `sparse` to its default value.\n", "The final model has a nonzero intercept for at least one outcome; it will be subtracted, but consider fitting a model without an intercept if possible.\n" ] }, { "data": { "text/plain": [ - "" + "" ] }, "execution_count": 4, @@ -183,7 +145,7 @@ ], "source": [ "est_t = TLearner(models=model_regression)\n", - "est_dm = DML(model_y=model_regression, model_t=model_propensity, model_final=model_regression)\n", + "est_dm = DML(model_y=model_regression, model_t=model_propensity, model_final=model_regression, discrete_treatment=True)\n", "\n", "est_t.fit(Ytrain, Dtrain, X=Xtrain)\n", "est_dm.fit(Ytrain, Dtrain, X=Xtrain)" @@ -236,24 +198,24 @@ " \n", " 0\n", " 1\n", - " -0.137\n", - " 0.142\n", - " 0.335\n", - " -0.015\n", - " 0.021\n", - " 0.242\n", - " -5.506\n", + " 0.078\n", + " 0.220\n", + " 0.722\n", + " -0.011\n", + " 0.023\n", + " 0.322\n", + " -9.163\n", " \n", " \n", " 1\n", " 2\n", - " 1.209\n", - " 0.095\n", + " 1.003\n", + " 0.062\n", " 0.000\n", - " 0.373\n", + " 0.375\n", " 0.024\n", " 0.000\n", - " 0.090\n", + " -0.178\n", " \n", " \n", "\n", @@ -261,12 +223,12 @@ ], "text/plain": [ " treatment blp_est blp_se blp_pval qini_est qini_se qini_pval \\\n", - "0 1 -0.137 0.142 0.335 -0.015 0.021 0.242 \n", - "1 2 1.209 0.095 0.000 0.373 0.024 0.000 \n", + "0 1 0.078 0.220 0.722 -0.011 0.023 0.322 \n", + "1 2 1.003 0.062 0.000 0.375 0.024 0.000 \n", "\n", " cal_r_squared \n", - "0 -5.506 \n", - "1 0.090 " + "0 -9.163 \n", + "1 -0.178 " ] }, "execution_count": 5, @@ -294,7 +256,7 @@ { "data": { "text/plain": [ - "" + "" ] }, "execution_count": 6, @@ -303,7 +265,7 @@ }, { "data": { - "image/png": "", + "image/png": "", "text/plain": [ "
" ] @@ -324,7 +286,7 @@ { "data": { "text/plain": [ - "" + "" ] }, "execution_count": 7, @@ -333,7 +295,7 @@ }, { "data": { - "image/png": "", + "image/png": "", "text/plain": [ "
" ] @@ -401,24 +363,24 @@ " \n", " 0\n", " 1\n", - " -0.185\n", + " -0.184\n", " 0.111\n", - " 0.096\n", + " 0.098\n", " -0.044\n", " 0.022\n", - " 0.023\n", - " -2.747\n", + " 0.022\n", + " -2.623\n", " \n", " \n", " 1\n", " 2\n", - " 0.716\n", + " 0.717\n", " 0.060\n", " 0.000\n", " 0.371\n", " 0.025\n", " 0.000\n", - " 0.626\n", + " 0.627\n", " \n", " \n", "\n", @@ -426,12 +388,12 @@ ], "text/plain": [ " treatment blp_est blp_se blp_pval qini_est qini_se qini_pval \\\n", - "0 1 -0.185 0.111 0.096 -0.044 0.022 0.023 \n", - "1 2 0.716 0.060 0.000 0.371 0.025 0.000 \n", + "0 1 -0.184 0.111 0.098 -0.044 0.022 0.022 \n", + "1 2 0.717 0.060 0.000 0.371 0.025 0.000 \n", "\n", " cal_r_squared \n", - "0 -2.747 \n", - "1 0.626 " + "0 -2.623 \n", + "1 0.627 " ] }, "execution_count": 8, @@ -459,7 +421,7 @@ { "data": { "text/plain": [ - "" + "" ] }, "execution_count": 9, @@ -468,7 +430,7 @@ }, { "data": { - "image/png": "", + "image/png": "", "text/plain": [ "
" ] @@ -489,7 +451,7 @@ { "data": { "text/plain": [ - "" + "" ] }, "execution_count": 10, @@ -498,7 +460,7 @@ }, { "data": { - "image/png": "", + "image/png": "", "text/plain": [ "
" ] @@ -521,7 +483,7 @@ ], "metadata": { "kernelspec": { - "display_name": "Python 3 (ipykernel)", + "display_name": "dev_env", "language": "python", "name": "python3" }, @@ -535,9 +497,9 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.9.17" + "version": "3.10.9" } }, "nbformat": 4, "nbformat_minor": 4 -} \ No newline at end of file +} From 12dae44c5c4ec161263ac32b5115dc20c19320cd Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Wed, 10 Jan 2024 15:45:27 -0500 Subject: [PATCH 23/25] rename function, fix warning Signed-off-by: Fabio Vera --- econml/_ortho_learner.py | 6 +++--- econml/tests/test_utilities.py | 10 +++++----- econml/utilities.py | 2 +- 3 files changed, 9 insertions(+), 9 deletions(-) diff --git a/econml/_ortho_learner.py b/econml/_ortho_learner.py index 76a51a374..9a53f1f70 100644 --- a/econml/_ortho_learner.py +++ b/econml/_ortho_learner.py @@ -43,7 +43,7 @@ class in this module implements the general logic in a very versatile way TreatmentExpansionMixin) from .inference import BootstrapInference from .utilities import (_deprecate_positional, check_input_arrays, - cross_product, filter_none_kwargs, single_strata_from_discrete_arrays, + cross_product, filter_none_kwargs, strata_from_discrete_arrays, inverse_onehot, jacify_featurizer, ndim, reshape, shape, transpose) from .sklearn_extensions.model_selection import ModelSelector @@ -636,7 +636,7 @@ def _strata(self, Y, T, X=None, W=None, Z=None, if self.discrete_instrument: arrs.append(Z) - return single_strata_from_discrete_arrays(arrs) + return strata_from_discrete_arrays(arrs) def _prefit(self, Y, T, *args, only_final=False, **kwargs): @@ -721,7 +721,7 @@ def fit(self, Y, T, *, X=None, W=None, Z=None, sample_weight=None, freq_weight=N f"Only one outcome variable is supported when discrete_outcome=True. 
Got Y of shape {Y.shape}") if len(self.outcome_transformer.classes_) > 2: raise AttributeError( - f"({self.outcome_transformer.classes_} outcome classes detected. \ + f"({len(self.outcome_transformer.classes_)} outcome classes detected. \ Currently, only 2 outcome classes are allowed when discrete_outcome=True. \ Classes provided include {self.outcome_transformer.classes_[:5]}") else: diff --git a/econml/tests/test_utilities.py b/econml/tests/test_utilities.py index b80fb2c8b..518da03a5 100644 --- a/econml/tests/test_utilities.py +++ b/econml/tests/test_utilities.py @@ -10,7 +10,7 @@ import pytest from econml.utilities import (einsum_sparse, todense, tocoo, transpose, inverse_onehot, cross_product, transpose_dictionary, deprecated, _deprecate_positional, - single_strata_from_discrete_arrays) + strata_from_discrete_arrays) from sklearn.preprocessing import OneHotEncoder @@ -184,7 +184,7 @@ def test_single_strata_from_discrete_array(self): Z = np.repeat([[0, 1]], 6, axis=0).ravel() Y = np.repeat([0, 1], 6, axis=0) - assert set(single_strata_from_discrete_arrays([T, Z, Y])) == set(np.arange(12)) - assert set(single_strata_from_discrete_arrays([T, Z])) == set(np.arange(6)) - assert set(single_strata_from_discrete_arrays([T])) == set(np.arange(3)) - assert single_strata_from_discrete_arrays([]) is None + assert set(strata_from_discrete_arrays([T, Z, Y])) == set(np.arange(12)) + assert set(strata_from_discrete_arrays([T, Z])) == set(np.arange(6)) + assert set(strata_from_discrete_arrays([T])) == set(np.arange(3)) + assert strata_from_discrete_arrays([]) is None diff --git a/econml/utilities.py b/econml/utilities.py index db3f4cb49..fc577954a 100644 --- a/econml/utilities.py +++ b/econml/utilities.py @@ -1484,7 +1484,7 @@ def jacify_featurizer(featurizer): return _TransformerWrapper(featurizer) -def single_strata_from_discrete_arrays(arrs): +def strata_from_discrete_arrays(arrs): """ Combine multiple discrete arrays into a single array for stratification purposes: From 
5014d4c82e8d9d5c0561fba4518c45f3ea18a4e7 Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Thu, 11 Jan 2024 13:50:27 -0500 Subject: [PATCH 24/25] add test for discrete model constraints, fix warning whitespace Signed-off-by: Fabio Vera --- econml/_ortho_learner.py | 6 +-- econml/dr/_drlearner.py | 11 +++-- econml/sklearn_extensions/model_selection.py | 9 +++- econml/tests/test_discrete_outcome.py | 43 ++++++++++++++++++++ econml/utilities.py | 2 +- 5 files changed, 61 insertions(+), 10 deletions(-) diff --git a/econml/_ortho_learner.py b/econml/_ortho_learner.py index 9a53f1f70..9423617c2 100644 --- a/econml/_ortho_learner.py +++ b/econml/_ortho_learner.py @@ -721,9 +721,9 @@ def fit(self, Y, T, *, X=None, W=None, Z=None, sample_weight=None, freq_weight=N f"Only one outcome variable is supported when discrete_outcome=True. Got Y of shape {Y.shape}") if len(self.outcome_transformer.classes_) > 2: raise AttributeError( - f"({len(self.outcome_transformer.classes_)} outcome classes detected. \ - Currently, only 2 outcome classes are allowed when discrete_outcome=True. \ - Classes provided include {self.outcome_transformer.classes_[:5]}") + f"({len(self.outcome_transformer.classes_)} outcome classes detected. " + "Currently, only 2 outcome classes are allowed when discrete_outcome=True. 
" + f"Classes provided include {self.outcome_transformer.classes_[:5]}") else: self.outcome_transformer = None diff --git a/econml/dr/_drlearner.py b/econml/dr/_drlearner.py index b08883f3b..ed10378f8 100644 --- a/econml/dr/_drlearner.py +++ b/econml/dr/_drlearner.py @@ -103,12 +103,15 @@ def predict(self, Y, T, X=None, W=None, *, sample_weight=None, groups=None): n = T.shape[0] Y_pred = np.zeros((T.shape[0], T.shape[1] + 1)) T_counter = np.zeros(T.shape) - if self._discrete_outcome and hasattr(self._model_regression, 'predict_proba'): - Y_pred[:, 0] = self._model_regression.predict_proba(np.hstack([XW, T_counter]))[:, 1].reshape(n) + if hasattr(self._model_regression, 'predict_proba'): + if self._discrete_outcome: + Y_pred[:, 0] = self._model_regression.predict_proba(np.hstack([XW, T_counter]))[:, 1].reshape(n) + else: + raise AttributeError("Cannot use a classifier for model_regression when discrete_outcome=False!") else: if self._discrete_outcome: - warn("A regressor was passed when discrete_outcome=True. \ - Using a classifier is recommended.", UserWarning) + warn("A regressor was passed to model_regression when discrete_outcome=True. 
" + "Using a classifier is recommended.", UserWarning) Y_pred[:, 0] = self._model_regression.predict(np.hstack([XW, T_counter])).reshape(n) Y_pred[:, 0] += (Y.reshape(n) - Y_pred[:, 0]) * np.all(T == 0, axis=1) / propensities[:, 0] for t in np.arange(T.shape[1]): diff --git a/econml/sklearn_extensions/model_selection.py b/econml/sklearn_extensions/model_selection.py index 4b1456d51..dda389eaf 100644 --- a/econml/sklearn_extensions/model_selection.py +++ b/econml/sklearn_extensions/model_selection.py @@ -318,8 +318,13 @@ def best_score(self): def predict(self, *args, **kwargs): return self.best_model.predict(*args, **kwargs) - def predict_proba(self, *args, **kwargs): - return self.best_model.predict_proba(*args, **kwargs) + # only expose predict_proba if best_model has predict_proba + # used because logic elsewhere uses hasattr predict proba to check if model is a classifier + def __getattr__(self, name): + if name == 'predict_proba': + return getattr(self.best_model, name) + else: + self.__getattribute__(name) def score(self, *args, **kwargs): if hasattr(self.best_model, 'score'): diff --git a/econml/tests/test_discrete_outcome.py b/econml/tests/test_discrete_outcome.py index b8e650478..da670f44f 100644 --- a/econml/tests/test_discrete_outcome.py +++ b/econml/tests/test_discrete_outcome.py @@ -180,3 +180,46 @@ def gen_array(n, is_binary, d): 'predict_proba' ) ), 'Auto outcome model is not a classifier!' 
+ + def test_constraints(self): + """ + Confirm errors/warnings when discreteness is not handled correctly for + discrete outcomes and treatments + """ + X = np.random.normal(size=(100, 3)) + Y = np.random.choice([0, 1], size=(100)) + T = np.random.choice([0, 1], size=(100, 1)) + + ests = [ + LinearDML() + ] + + for est in ests: + with self.subTest(est=est, kind='discrete treatment'): + est.discrete_treatment = False + est.model_t = LogisticRegression() + with pytest.raises(AttributeError): + est.fit(Y=Y, T=T, X=X) + est.discrete_treatment = True + est.model_t = LinearRegression() + with pytest.warns(UserWarning): + est.fit(Y=Y, T=T, X=X) + + ests += [LinearDRLearner()] + for est in ests: + print(est) + with self.subTest(est=est, kind='discrete outcome'): + est.discrete_outcome = False + if isinstance(est, LinearDRLearner): + est.model_regression = LogisticRegression() + else: + est.model_y = LogisticRegression() + with pytest.raises(AttributeError): + est.fit(Y=Y, T=T, X=X) + est.discrete_outcome = True + if isinstance(est, LinearDRLearner): + est.model_regression = LinearRegression() + else: + est.model_y = LinearRegression() + with pytest.warns(UserWarning): + est.fit(Y=Y, T=T, X=X) diff --git a/econml/utilities.py b/econml/utilities.py index fc577954a..8e9bc8fa5 100644 --- a/econml/utilities.py +++ b/econml/utilities.py @@ -587,7 +587,7 @@ def check_input_arrays(*args, validate_len=True, force_all_finite=True, dtype=No try: assert_all_finite(new_arg) except ValueError: - warnings.warn("Input contains NaN. Causal identification strategy can be" + warnings.warn("Input contains NaN. 
Causal identification strategy can be erroneous" " in the presence of missing values.") if validate_len: From 74842eb961a3e05caa06d284b3601470f39a2256 Mon Sep 17 00:00:00 2001 From: Fabio Vera Date: Thu, 11 Jan 2024 15:23:03 -0500 Subject: [PATCH 25/25] fix test Signed-off-by: Fabio Vera --- econml/tests/test_federated_learning.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/econml/tests/test_federated_learning.py b/econml/tests/test_federated_learning.py index 27f656945..9c7c5804c 100644 --- a/econml/tests/test_federated_learning.py +++ b/econml/tests/test_federated_learning.py @@ -70,7 +70,7 @@ def test_lineardrlearner(self): b = np.random.normal(size=(n_x + n_w + n_t - 1)) t_model = FunctionClassifier(lambda XW: np.exp(XW @ a)) - y_model = FunctionClassifier(lambda XW: XW @ b) + y_model = FunctionRegressor(lambda XW: XW @ b) for cov_type in ['HC0', 'HC1', 'nonrobust']: with self.subTest(n_t=n_t, cov_type=cov_type):