-
Notifications
You must be signed in to change notification settings - Fork 93
/
GLMTransformedOutcome.py
36 lines (29 loc) · 1.61 KB
/
GLMTransformedOutcome.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
"""GLM for uplift modeling"""
"""Modified version of Driverless AI's internal GLM implementation with transformed outcome transformation.
See e.g. https://pylift.readthedocs.io/en/latest/introduction.html#the-transformed-outcome for more information.
This recipe is intended to be used for creating binary classification uplift models using the transformed outcome approach.
You need to use one of the transformed outcome uplift models along with the AUUC scorer. The `treatment` column is passed
as the `weight` column, and the Driverless AI task needs to be _regression_ (since, after the transformation, the target
variable becomes the uplift directly).
"""
from h2oaicore.models import BaseCustomModel, GLMModel
import numpy as np
import datatable as dt
class GLMTransformedOutcome(BaseCustomModel, GLMModel):
    """GLM regressor trained on the transformed outcome for uplift modeling.

    The treatment indicator is expected to arrive through ``sample_weight``.
    ``fit`` uses it to rewrite the target and then delegates to the parent
    ``fit`` with no sample weights at all.
    """

    # Task-type switches: only regression is enabled for this recipe.
    _regression = True
    _binary = False
    _multiclass = False
    _mojo = True
    _is_reproducible = False  # might not reproduce identically on GPUs
    _testing_can_skip_failure = False  # ensure tested as if shouldn't fail
    _description = "Transformed Outcome Uplift Estimator based on GLM"
    _display_name = "GLMTO"

    def fit(self, X: dt.Frame, y: np.array, sample_weight: np.array = None,
            eval_set=None, sample_weight_eval_set=None, **kwargs):
        """Fit the parent GLM on the transformed outcome.

        When ``sample_weight`` is given it is treated as the treatment
        column. With ``p = mean(sample_weight)`` the target is replaced by
        ``y * (sample_weight - p) / (p * (1 - p))``. When ``sample_weight``
        is ``None`` the target is passed through unchanged.

        Args:
            X: Training features, forwarded unchanged to the parent ``fit``.
            y: Original outcome values.
            sample_weight: Treatment column carried in the weight slot.
                Assumed to be a 0/1 indicator -- TODO confirm with callers.
            eval_set: Forwarded unchanged to the parent ``fit``.
            sample_weight_eval_set: Accepted for interface compatibility but
                not forwarded; the parent always receives ``None``.
            **kwargs: Forwarded unchanged to the parent ``fit``.

        Returns:
            Whatever the parent ``fit`` returns.

        Raises:
            ValueError: If the mean of ``sample_weight`` is exactly 0 or 1,
                which makes the transformation divide by zero.
        """
        if sample_weight is not None:
            # weights are carrying the treatment
            treatment_policy = np.mean(sample_weight)
            denominator = treatment_policy * (1 - treatment_policy)
            if denominator == 0:
                # Without this guard NumPy would only emit a RuntimeWarning
                # and hand NaN/inf targets to the underlying GLM.
                raise ValueError(
                    "Transformed outcome is undefined: the mean of the "
                    "treatment column (passed as weight) is "
                    f"{treatment_policy}, so p * (1 - p) is zero. Both "
                    "treated and untreated rows are required."
                )
            y = y * ((sample_weight - treatment_policy) / denominator)

        # The weights were consumed as the treatment indicator above, so the
        # underlying GLM is fitted unweighted.
        # NOTE(review): targets inside eval_set are forwarded untransformed --
        # confirm whether the parent uses them for validation.
        return super().fit(X, y, None, eval_set, None, **kwargs)

    @staticmethod
    def do_acceptance_test():
        """Return False (presumably opts out of the acceptance test)."""
        return False