TODO:

implement Algorithm 1
apply it to the example from here
use shap to reproduce the manually calculated outputs

In [1]:

import itertools
import pickle
import math

import numpy as np
import pandas as pd
import shap
import matplotlib.pyplot as plt
from sklearn.tree import DecisionTreeRegressor, plot_tree

In [2]:

# for auto-reloading external modules
# see http://stackoverflow.com/questions/1907993/autoreload-of-modules-in-ipython
get_ipython().magic("load_ext autoreload")
get_ipython().magic("autoreload 2")

In [3]:

with open('./tree_model.pkl', 'rb') as opened:
    tree_model = pickle.load(opened)

Trying to unpickle estimator DecisionTreeRegressor from version 1.0.1 when using version 0.23.2. This might lead to breaking code or invalid results. Use at your own risk.

In [4]:

tree_model

From version 0.24, get_params will raise an AttributeError if a parameter cannot be retrieved as an instance attribute. Previously it would return None.

Out[4]:

DecisionTreeRegressor(criterion='mae', max_depth=2, presort=None,
                      random_state=100)

In [5]:

tree = tree_model.tree_

In [6]:

import tree_shap

In [7]:

tree.predict(np.array([[150, 75, 200]], dtype=np.float32))

Out[7]:

array([[20.]])

In [8]:

x = [150, 75, 200]

In [10]:

assert tree_shap.exp_value(x, S={}, tree=tree) == 23
assert tree_shap.exp_value(x, S={0}, tree=tree) == 20
assert tree_shap.exp_value(x, S={1}, tree=tree) == 27
assert tree_shap.exp_value(x, S={0, 1}, tree=tree) == 20

In [ ]:

x2 = np.array([100, 25, 400])

In [10]:

shap.TreeExplainer?

In [11]:

explainer = shap.TreeExplainer(tree_model)
explainer.shap_values(x2)

---------------------------------------------------------------------------
NameError                                 Traceback (most recent call last)
<ipython-input-11-7ef351b65faf> in <module>
      1 explainer = shap.TreeExplainer(tree_model)
----> 2 explainer.shap_values(x2)

NameError: name 'x2' is not defined

In [12]:

x = x2

---------------------------------------------------------------------------
NameError                                 Traceback (most recent call last)
<ipython-input-12-cb64638f1b76> in <module>
----> 1 x = x2

NameError: name 'x2' is not defined

In [57]:

# ϕ0 = tree_shap.exp_value(x, {}, tree)

# ϕs = []
preds = {}
for card in range(0, len(x) + 1):
    for perm in itertools.permutations(range(len(x)), r=card):
        preds[tuple(perm)] = tree_shap.exp_value(x, S=set(perm), tree=tree)

In [58]:

preds

Out[58]:

{(): 23.0,
 (0,): 40.0,
 (1,): 27.0,
 (2,): 23.0,
 (0, 1): 50.0,
 (0, 2): 40.0,
 (1, 0): 50.0,
 (1, 2): 27.0,
 (2, 0): 40.0,
 (2, 1): 27.0,
 (0, 1, 2): 50.0,
 (0, 2, 1): 50.0,
 (1, 0, 2): 50.0,
 (1, 2, 0): 50.0,
 (2, 0, 1): 50.0,
 (2, 1, 0): 50.0}

In [59]:

deltas = [0] * len(x)
for perm in itertools.permutations(range(len(x)), r=len(x)):
    for index, i in enumerate(perm):
        deltas[i] += preds[perm[:index+1]] - preds[perm[:index]]

In [60]:

np.array(deltas) / math.factorial(len(x))

Out[60]:

array([20.,  7.,  0.])

In [ ]:

In [40]:

ϕ0 = preds[()]
ϕs = []
for i in range(len(x)):
    delta = 0
    for key in preds:
        if i in key:
            delta += preds[key] - preds[tuple(_ for _ in key if _ != i)]
#     ϕs.append(delta / math.factorial(len(x)))
    ϕs.append(delta)

In [41]:

ϕ0

Out[41]:

23.0

In [42]:

ϕs

Out[42]:

[-65.0, 12.0, 0.0]

In [ ]:

In [11]:

features_tuple = ((0, 150), (1, 75), (2, 200))

In [17]:

# follows the calculation at https://medium.com/analytics-vidhya/shap-part-3-tree-shap-3af9bcd7cd9b closely

basis = tree_shap.exp_value(x, {}, tree)

all_phis = []
for perm in itertools.permutations(features_tuple):
    phis = {"basis": basis}
    for i in range(len(perm)):
        phi_raw = tree_shap.exp_value(x, S={_[0] for _ in perm[: i + 1]}, tree=tree)
        phi = phi_raw - sum(phis.values())
        phis[perm[i][0]] = phi
    all_phis.append(phis)

In [18]:

perm

Out[18]:

((2, 200), (1, 75), (0, 150))

In [19]:

{_[0] for _ in perm}

Out[19]:

{0, 1, 2}

In [20]:

all_phis

Out[20]:

[{'basis': 23.0, 0: -3.0, 1: 0.0, 2: 0.0},
 {'basis': 23.0, 0: -3.0, 2: 0.0, 1: 0.0},
 {'basis': 23.0, 1: 4.0, 0: -7.0, 2: 0.0},
 {'basis': 23.0, 1: 4.0, 2: 0.0, 0: -7.0},
 {'basis': 23.0, 2: 0.0, 0: -3.0, 1: 0.0},
 {'basis': 23.0, 2: 0.0, 1: 4.0, 0: -7.0}]

In [21]:

pd.DataFrame(all_phis)

Out[21]:

	basis	0	1
0	23.0	-3.0	0.0
1	23.0	-3.0	0.0
2	23.0	-7.0	4.0
3	23.0	-7.0	4.0
4	23.0	-3.0	0.0
5	23.0	-7.0	4.0

In [22]:

pd.DataFrame(all_phis).mean()

Out[22]:

basis    23.0
0        -5.0
1         2.0
2         0.0
dtype: float64

In [ ]:

In [33]:

math.factorial(3)

Out[33]:

In [41]:

preds = {}

for card in range(len(x) + 1):  # cardinality of S
    for perm in itertools.permutations(range(len(x)), r=card):
        S = set(perm)
        preds[S] = tree_shap.exp_value(x, S, tree)

---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
<ipython-input-41-181e585d6128> in <module>
      4     for perm in itertools.permutations(range(len(x)), r=card):
      5         S = set(perm)
----> 6         preds[S] = tree_shap.exp_value(x, S, tree)

TypeError: unhashable type: 'set'

In [58]:

pd.DataFrame(all_phis).mean(axis=0)

Out[58]:

basis    23.0
0        -1.0
1        -1.0
2        -1.0
dtype: float64

In [ ]:

all_phis = []
for permutation in itertools.permutations(features_tuple):
    phis = {'basis': basis}
    for i in range(len(permutation)):
        phi_raw = tree_shap.naive_tree_shap(tree, current_node=0, features=dict(permutation[:i + 1]))
        phi = phi_raw - sum(phis.values())
        phis[permutation[i][0]] = phi
    all_phis.append(phis)

In [48]:

pd.DataFrame(all_phis).mean(axis=0)

Out[48]:

basis    23.0
0        -5.0
1         2.0
2         0.0
dtype: float64

In [ ]:

In [25]:

tree_shap.exp_value(x, S={1, 2}, tree=tree)

Out[25]:

27.0

In [8]:

tree_shap.naive_tree_shap(
    tree,
    current_node=0,
    features={0: 150},
)

Out[8]:

20.0

In [9]:

assert (
    tree_shap.naive_tree_shap(
        tree,
        current_node=0,
        features={0: 150},
    )
    == 20
)
assert (
    tree_shap.naive_tree_shap(
        tree,
        current_node=0,
        features={1: 75},
    )
    == 27
)

# given feature 0, having feature 1 doesn't make a difference
assert (
    tree_shap.naive_tree_shap(
        tree,
        current_node=0,
        features={0: 150, 1: 75},
    )
    == 20
)

In [ ]:

In [20]:

X_test = pd.DataFrame(
    {
        "x0": [150],
        "x1": [75],
        "x2": [200],
    }
)

In [68]:

tree.n_node_samples

Out[68]:

array([10,  4,  2,  2,  6,  1,  5], dtype=int64)

In [63]:

tree.children_left

Out[63]:

array([ 1,  2, -1, -1,  5, -1, -1], dtype=int64)

In [70]:

tree.children_right

Out[70]:

array([ 4,  3, -1, -1,  6, -1, -1], dtype=int64)

In [67]:

tree.feature

Out[67]:

array([ 0,  1, -2, -2,  0, -2, -2], dtype=int64)

In [72]:

tree.threshold

Out[72]:

array([100., 300.,  -2.,  -2., 200.,  -2.,  -2.])

In [21]:

tree_model.predict(X_test)

Out[21]:

array([20.])

In [47]:

import sklearn.tree

In [51]:

tree.value?

In [50]:

tree.value.shape

Out[50]:

(7, 1, 1)

In [57]:

tree.value

Out[57]:

array([[[15.]],

       [[40.]],

       [[50.]],

       [[30.]],

       [[10.]],

       [[20.]],

       [[10.]]])

In [60]:

tree.n_node_samples

Out[60]:

array([10,  4,  2,  2,  6,  1,  5], dtype=int64)

In [ ]:

In [29]:

tree.n_outputs

Out[29]:

In [32]:

tree_model.feature_names_in_

Out[32]:

array(['x0', 'x1', 'x2'], dtype=object)

In [33]:

tree_model.tree_.feature

Out[33]:

array([ 0,  1, -2, -2,  0, -2, -2], dtype=int64)

In [28]:

tree.max_n_classes

Out[28]:

In [45]:

tree_model.max_features_

Out[45]:

In [43]:

tree.predict(np.array([[150, 75, 200]], dtype=np.float32))

Out[43]:

array([[20.]])

In [14]:

tree.children_left?

In [12]:

tree.feature

Out[12]:

array([ 0,  1, -2, -2,  0, -2, -2], dtype=int64)

In [7]:

tree.node_count

Out[7]:

In [8]:

import tree_shap

In [9]:

assert (
    tree_shap.naive_tree_shap(
        tree,
        current_node=0,
        features={0: 150},
    )
    == 20
)
assert (
    tree_shap.naive_tree_shap(
        tree,
        current_node=0,
        features={1: 75},
    )
    == 27
)

# given feature 0, having feature 1 doesn't make a difference
assert (
    tree_shap.naive_tree_shap(
        tree,
        current_node=0,
        features={0: 150, 1: 75},
    )
    == 20
)

In [10]:

import itertools

In [13]:

features_tuple = ((0, 150), (1, 75), (2, 200))

Need to rename the variables here to make it more readable

In [44]:

all_phis = []
for permutation in itertools.permutations(features_tuple):
    phis = {'basis': basis}
    for i in range(len(permutation)):
        phi_raw = tree_shap.naive_tree_shap(tree, current_node=0, features=dict(permutation[:i + 1]))
        phi = phi_raw - sum(phis.values())
        phis[permutation[i][0]] = phi
    all_phis.append(phis)

In [45]:

all_phis

Out[45]:

[{'basis': 23.0, 0: -3.0, 1: 0.0, 2: 0.0}, {'basis': 23.0, 0: -3.0, 2: 0.0, 1: 0.0}, {'basis': 23.0, 1: 4.0, 0: -7.0, 2: 0.0}, {'basis': 23.0, 1: 4.0, 2: 0.0, 0: -7.0}, {'basis': 23.0, 2: 0.0, 0: -3.0, 1: 0.0}, {'basis': 23.0, 2: 0.0, 1: 4.0, 0: -7.0}]

In [48]:

pd.DataFrame(all_phis).mean(axis=0)

Out[48]:

basis    23.0
0        -5.0
1         2.0
2         0.0
dtype: float64

In [36]:

from collections import OrderedDict

In [43]:

OrderedDict(features_tuple)[:2]

---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
<ipython-input-43-dafde3bde0d2> in <module>
----> 1 OrderedDict(features_tuple)[:2]

TypeError: unhashable type: 'slice'

In [38]:

list(itertools.permutations(OrderedDict(features_tuple)))

Out[38]:

[(0, 1, 2), (0, 2, 1), (1, 0, 2), (1, 2, 0), (2, 0, 1), (2, 1, 0)]

In [35]:

permutation

Out[35]:

((2, 200), (1, 75), (0, 150))

In [27]:

phis

Out[27]:

[23.0, 0.0, 4.0, -7.0]

In [28]:

permutation

Out[28]:

((2, 200), (1, 75), (0, 150))

In [34]:

np.array(all_phis)[:, 1:]

Out[34]:

array([[-3.,  0.,  0.],
       [-3.,  0.,  0.],
       [ 4., -7.,  0.],
       [ 4.,  0., -7.],
       [ 0., -3.,  0.],
       [ 0.,  4., -7.]])

In [33]:

np.array(all_phis)[:, 1:].mean(axis=0)

Out[33]:

array([ 0.33333333, -1.        , -2.33333333])

In [ ]:

In [29]:

itertools.subpermutation

Out[29]:

(0, 1, 2)

In [ ]:

In [10]:

tree.feature

Out[10]:

array([ 0,  1, -2, -2,  0, -2, -2])

In [30]:

tree.tree_.value

Out[30]:

array([[[15.]],

       [[40.]],

       [[50.]],

       [[30.]],

       [[10.]],

       [[20.]],

       [[10.]]])

In [46]:

tree.decision_path([[150, 75, 200]]).todense()

Out[46]:

matrix([[1, 0, 0, 0, 1, 1, 0]])

In [17]:

tree.tree_.children_left

Out[17]:

array([ 1,  2, -1, -1,  5, -1, -1])

In [18]:

tree.tree_.children_right

Out[18]:

array([ 4,  3, -1, -1,  6, -1, -1])

In [23]:

tree.tree_.

Out[23]:

In [24]:

tree.tree_.threshold

Out[24]:

array([100., 300.,  -2.,  -2., 200.,  -2.,  -2.])

In [ ]:

In [22]:

_ = plot_tree(tree, filled=True, proportion=False)

Explain for the example [x=150, y=75, z=200]

In [26]:

import sklearn

In [41]:

tree.tree_.threshold

Out[41]:

array([100., 300.,  -2.,  -2., 200.,  -2.,  -2.])

In [40]:

tree.tree_.feature

Out[40]:

array([ 0,  1, -2, -2,  0, -2, -2])

In [39]:

tree.tree_.children_left

Out[39]:

array([ 1,  2, -1, -1,  5, -1, -1])

In [42]:

tree.tree_.children_right

Out[42]:

array([ 4,  3, -1, -1,  6, -1, -1])

In [31]:

tree.tree_.children_left

Out[31]:

array([ 1,  2, -1, -1,  5, -1, -1])

In [47]:

from collections import OrderedDict

In [56]:

features = [[1, 75], [2, 200], [0, 150]]

In [57]:

features[:2]

Out[57]:

[[1, 75], [2, 200]]

In [58]:

tree.tree_.n_node_samples

Out[58]:

array([10,  4,  2,  2,  6,  1,  5])

In [ ]:

def decision_path(i):
    """
    i: index of features
    """
    if i == tree.tree_.feature[0]

In [ ]:

x > y > z

In [12]:

phi_x = 20 - phi_null

In [13]:

phi_y = 20 - phi_x - phi_null

In [14]:

phi_z = 20 - phi_y - phi_x - phi_null

In [15]:

phi_z

Out[15]:

0.0

y > z > x

In [16]:

phi_y = (4 / 10) * 50 + (6 / 10) * (1 / 6 * 20 + 5 / 6 * 10) - phi_null

In [17]:

phi_y

Out[17]:

4.0

In [18]:

phi_z = 0

In [19]:

phi_x = 20 - phi_y - phi_null

In [20]:

phi_x

Out[20]:

-7.0

In [ ]:

In [21]:

tree.predict([[150, 75, 200]])

Out[21]:

array([20.])

In [ ]:

In [22]:

X_test = pd.DataFrame({'x': [150], 'y': [75], 'z': [200]})

In [24]:

explainer = shap.TreeExplainer(tree)
shap_values = explainer.shap_values(X_test)
shap_values

Setting feature_perturbation = "tree_path_dependent" because no background data was given.

Out[24]:

array([[-5.,  2.,  0.]])

In [ ]: