
Commit 2d112cd

jeongyoonlee and claude committed
Add BaseDRClassifier for binary classification with probabilities
Implements BaseDRClassifier class to address issue #819 by providing a DR-learner that outputs probabilities for binary classification problems, similar to other S/T/X learner classifiers.

Key features:
- Uses predict_proba() for outcome models to return probabilities
- Maintains doubly robust estimation framework
- Supports both single learner and separate outcome/effect learners
- Includes comprehensive tests with classification data
- Follows existing classifier implementation patterns

Fixes #819

🤖 Generated with [Claude Code](https://claude.ai/code)

Co-Authored-By: Claude <[email protected]>
1 parent 5f5c4fb commit 2d112cd
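
For orientation, a minimal usage sketch of the new class, mirroring the test added in this commit. The synthetic data via sklearn's make_classification and the seed are illustrative assumptions, not part of the change:

import numpy as np
from sklearn.datasets import make_classification
from sklearn.linear_model import LinearRegression, LogisticRegression

from causalml.inference.meta import BaseDRClassifier

# Illustrative synthetic binary-outcome data (not part of this commit)
np.random.seed(42)
X, y = make_classification(n_samples=1000, n_features=8, random_state=42)
treatment = np.random.binomial(1, 0.5, size=X.shape[0])  # 0 = control, 1 = treated

learner = BaseDRClassifier(
    learner=LogisticRegression(),                 # outcome models use predict_proba()
    treatment_effect_learner=LinearRegression(),  # effect model is a plain regressor
)

# CATE estimates: one column per non-control treatment group
te = learner.fit_predict(X=X, treatment=treatment, y=y)

# Optionally return the outcome-model probabilities alongside the effects
te, yhat_cs, yhat_ts = learner.fit_predict(
    X=X, treatment=treatment, y=y, return_components=True
)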

3 files changed, +137 −3 lines

causalml/inference/meta/__init__.py

Lines changed: 1 addition & 1 deletion
@@ -9,4 +9,4 @@
 from .xlearner import BaseXLearner, BaseXRegressor, BaseXClassifier
 from .rlearner import BaseRLearner, BaseRRegressor, BaseRClassifier, XGBRRegressor
 from .tmle import TMLELearner
-from .drlearner import BaseDRLearner, BaseDRRegressor, XGBDRRegressor
+from .drlearner import BaseDRLearner, BaseDRRegressor, BaseDRClassifier, XGBDRRegressor

causalml/inference/meta/drlearner.py

Lines changed: 87 additions & 1 deletion
@@ -13,7 +13,7 @@
     check_p_conditions,
     convert_pd_to_np,
 )
-from causalml.metrics import regression_metrics
+from causalml.metrics import regression_metrics, classification_metrics
 from causalml.propensity import compute_propensity_score
 
 
@@ -487,6 +487,92 @@ def __init__(
         )
 
 
+class BaseDRClassifier(BaseDRLearner):
+    """
+    A parent class for DR-learner classifier classes.
+    """
+
+    def __init__(
+        self,
+        learner=None,
+        control_outcome_learner=None,
+        treatment_outcome_learner=None,
+        treatment_effect_learner=None,
+        ate_alpha=0.05,
+        control_name=0,
+    ):
+        """Initialize a DR-learner classifier.
+
+        Args:
+            learner (optional): a model to estimate outcomes and treatment effects in both the control and treatment
+                groups. Should have a predict_proba() method for outcome models.
+            control_outcome_learner (optional): a model to estimate outcomes in the control group.
+                Should have a predict_proba() method.
+            treatment_outcome_learner (optional): a model to estimate outcomes in the treatment group.
+                Should have a predict_proba() method.
+            treatment_effect_learner (optional): a model to estimate treatment effects in the treatment group.
+                Should be a regressor.
+            ate_alpha (float, optional): the confidence level alpha of the ATE estimate
+            control_name (str or int, optional): name of control group
+        """
+        super().__init__(
+            learner=learner,
+            control_outcome_learner=control_outcome_learner,
+            treatment_outcome_learner=treatment_outcome_learner,
+            treatment_effect_learner=treatment_effect_learner,
+            ate_alpha=ate_alpha,
+            control_name=control_name,
+        )
+
+    def predict(
+        self, X, treatment=None, y=None, p=None, return_components=False, verbose=True
+    ):
+        """Predict treatment effects.
+
+        Args:
+            X (np.matrix or np.array or pd.Dataframe): a feature matrix
+            treatment (np.array or pd.Series, optional): a treatment vector
+            y (np.array or pd.Series, optional): an outcome vector
+            verbose (bool, optional): whether to output progress logs
+        Returns:
+            (numpy.ndarray): Predictions of treatment effects.
+        """
+        X, treatment, y = convert_pd_to_np(X, treatment, y)
+
+        te = np.zeros((X.shape[0], self.t_groups.shape[0]))
+        yhat_cs = {}
+        yhat_ts = {}
+
+        for i, group in enumerate(self.t_groups):
+            models_tau = self.models_tau[group]
+            _te = np.r_[[model.predict(X) for model in models_tau]].mean(axis=0)
+            te[:, i] = np.ravel(_te)
+            yhat_cs[group] = np.r_[
+                [model.predict_proba(X)[:, 1] for model in self.models_mu_c]
+            ].mean(axis=0)
+            yhat_ts[group] = np.r_[
+                [model.predict_proba(X)[:, 1] for model in self.models_mu_t[group]]
+            ].mean(axis=0)
+
+            if (y is not None) and (treatment is not None) and verbose:
+                mask = (treatment == group) | (treatment == self.control_name)
+                treatment_filt = treatment[mask]
+                y_filt = y[mask]
+                w = (treatment_filt == group).astype(int)
+
+                yhat = np.zeros_like(y_filt, dtype=float)
+                yhat[w == 0] = yhat_cs[group][mask][w == 0]
+                yhat[w == 1] = yhat_ts[group][mask][w == 1]
+
+                logger.info("Error metrics for group {}".format(group))
+                classification_metrics(y_filt, yhat, w)
+
+        if not return_components:
+            return te
+        else:
+            return te, yhat_cs, yhat_ts
+
+
 class XGBDRRegressor(BaseDRRegressor):
     def __init__(self, ate_alpha=0.05, control_name=0, *args, **kwargs):
         """Initialize a DR-learner with two XGBoost models."""

tests/test_meta_learners.py

Lines changed: 49 additions & 1 deletion
@@ -30,7 +30,7 @@
     XGBRRegressor,
 )
 from causalml.inference.meta import TMLELearner
-from causalml.inference.meta import BaseDRLearner
+from causalml.inference.meta import BaseDRLearner, BaseDRRegressor, BaseDRClassifier
 from causalml.metrics import ape, auuc_score
 
 from .const import RANDOM_SEED, N_SAMPLE, ERROR_THRESHOLD, CONTROL_NAME, CONVERSION
@@ -1039,3 +1039,51 @@ def test_BaseDRLearner(generate_regression_data):
         normalize=True,
     )
     assert auuc["cate_p"] > 0.5
+
+
+
+def test_BaseDRClassifier(generate_classification_data):
+    np.random.seed(RANDOM_SEED)
+
+    df, X_names = generate_classification_data()
+
+    df["treatment_group_key"] = np.where(
+        df["treatment_group_key"] == CONTROL_NAME, 0, 1
+    )
+
+    # Extract features and outcome
+    y = df[CONVERSION].values
+    X = df[X_names].values
+    treatment = df["treatment_group_key"].values
+
+    learner = BaseDRClassifier(
+        learner=LogisticRegression(),
+        treatment_effect_learner=LinearRegression()
+    )
+
+    # Test fit and predict
+    te = learner.fit_predict(X=X, treatment=treatment, y=y)
+
+    # Check that treatment effects are returned
+    assert te.shape[0] == X.shape[0]
+    assert te.shape[1] == len(np.unique(treatment[treatment != 0]))
+
+    # Test with return_components
+    te, yhat_cs, yhat_ts = learner.fit_predict(
+        X=X, treatment=treatment, y=y, return_components=True
+    )
+
+    # Check that components are returned as probabilities
+    for group in learner.t_groups:
+        assert np.all((yhat_cs[group] >= 0) & (yhat_cs[group] <= 1))
+        assert np.all((yhat_ts[group] >= 0) & (yhat_ts[group] <= 1))
+
+    # Test separate outcome and effect learners
+    learner_separate = BaseDRClassifier(
+        control_outcome_learner=LogisticRegression(),
+        treatment_outcome_learner=LogisticRegression(),
+        treatment_effect_learner=LinearRegression()
+    )
+
+    te_separate = learner_separate.fit_predict(X=X, treatment=treatment, y=y)
+    assert te_separate.shape == te.shape
