From 22b13c2594a491317908feb54c9f3401bafd9d43 Mon Sep 17 00:00:00 2001
From: ras44 <9282281+ras44@users.noreply.github.com>
Date: Fri, 7 Feb 2025 18:26:42 +0100
Subject: [PATCH] resolves #796 remove dep on pygam, use IsotonicRegression
 (#803)

* resolves #796 remove dep on pygam, use IsotonicRegression

* restrict propensity scores to (0,1); (0+2eps,1-2eps)

* linted

---------

Co-authored-by: Roland Stevenson
---
 causalml/propensity.py | 12 +++++++-----
 1 file changed, 7 insertions(+), 5 deletions(-)

diff --git a/causalml/propensity.py b/causalml/propensity.py
index f3aee9e3..f18cf28f 100644
--- a/causalml/propensity.py
+++ b/causalml/propensity.py
@@ -1,10 +1,10 @@
 from abc import ABCMeta, abstractmethod
 import logging
 import numpy as np
-from pygam import LogisticGAM, s
 from sklearn.metrics import roc_auc_score as auc
 from sklearn.linear_model import LogisticRegressionCV
 from sklearn.model_selection import StratifiedKFold, train_test_split
+from sklearn.isotonic import IsotonicRegression
 import xgboost as xgb
 
 
@@ -179,9 +179,9 @@ def predict(self, X):
 
 
 def calibrate(ps, treatment):
-    """Calibrate propensity scores with logistic GAM.
+    """Calibrate propensity scores with IsotonicRegression.
 
-    Ref: https://pygam.readthedocs.io/en/latest/api/logisticgam.html
+    Ref: https://scikit-learn.org/stable/modules/isotonic.html
 
     Args:
         ps (numpy.array): a propensity score vector
@@ -191,9 +191,11 @@ def calibrate(ps, treatment):
     Returns:
         (numpy.array): a calibrated propensity score vector
     """
-    gam = LogisticGAM(s(0)).fit(ps, treatment)
+    two_eps = 2.0 * np.finfo(float).eps
+    pm_ir = IsotonicRegression(out_of_bounds="clip", y_min=two_eps, y_max=1.0 - two_eps)
+    ps_ir = pm_ir.fit_transform(ps, treatment)
 
-    return gam.predict_proba(ps)
+    return ps_ir
 
 
 def compute_propensity_score(
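
Reviewer note (not part of the patch): a minimal standalone sketch of what the replacement does, using made-up names (raw_ps, treatment) and toy data. IsotonicRegression fits a monotone step function from the raw scores to the observed treatment rate, and y_min/y_max keep every calibrated score strictly inside (0, 1), mirroring the new calibrate() in causalml/propensity.py.

import numpy as np
from sklearn.isotonic import IsotonicRegression

rng = np.random.default_rng(0)
raw_ps = rng.uniform(0.05, 0.95, size=1000)        # hypothetical raw propensity scores
treatment = rng.binomial(1, raw_ps ** 0.5)         # toy treatment assignment, deliberately miscalibrated

two_eps = 2.0 * np.finfo(float).eps
iso = IsotonicRegression(out_of_bounds="clip", y_min=two_eps, y_max=1.0 - two_eps)
calibrated = iso.fit_transform(raw_ps, treatment)  # monotone map: raw score -> empirical P(T=1 | score)

# Calibrated scores are confined to [two_eps, 1 - two_eps], so none is exactly 0 or 1.
print(calibrated.min(), calibrated.max())

Unlike the previous LogisticGAM-based calibration, this path relies only on scikit-learn, which the package already imports, so the pygam dependency can be dropped.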