PDPs graph the dependence between a target response and a set of input features, marginalizing over the values of all other input features (the ‘complement’ features).
We can interpret PD as a function of the input features of interest.
Due to the limits of human perception, the size of the set of input features of interest must be small (usually one or two). The input features of interest are usually chosen among the most important ones.
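One way to pick them is to rank candidates first, for instance with permutation importance; the sketch below is only illustrative and assumes the fitted estimator est and the held-out split X_test, y_test created later in this example.

from sklearn.inspection import permutation_importance

# Rank features on held-out data; higher mean importance = better PD/ICE candidate.
result = permutation_importance(est, X_test, y_test,
                                n_repeats=5, random_state=0, n_jobs=3)
for idx in result.importances_mean.argsort()[::-1]:
    print(f"{X_test.columns[idx]:<10} "
          f"{result.importances_mean[idx]:.3f}"
          f" +/- {result.importances_std[idx]:.3f}")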
PDPs with two features of interest enable us to visualize their interactions.
This two-way PD plot shows the dependence of median house price on the joint values of house age and average occupants per household.
There's an interaction between the two features: for an average occupancy greater than two, the house price is nearly independent of the house age, whereas for values less than two there is a strong dependence on age.
features = ['AveOccup', 'HouseAge', ('AveOccup', 'HouseAge')]
tic = time()
_, ax = plt.subplots(ncols=3, figsize=(9, 4))
display = PPD(
    est, X_train, features,
    kind='average',
    n_jobs=3, grid_resolution=20,
    ax=ax)
print(f"done in {time() - tic:.3f}s")
display.figure_.suptitle(
    'PD, house value on non-location features\n'
    'California housing, Gradient Boosting')
display.figure_.subplots_adjust(wspace=0.4, hspace=0.3)
done in 1.018s
import numpy as np
from mpl_toolkits.mplot3d import Axes3D

fig = plt.figure()

features = ('AveOccup', 'HouseAge')
pdp = PD(est, X_train, features=features,
         kind='average', grid_resolution=20)
XX, YY = np.meshgrid(pdp["values"][0], pdp["values"][1])
Z = pdp.average[0].T
ax = Axes3D(fig)
surf = ax.plot_surface(XX, YY, Z, rstride=1, cstride=1,
                       cmap=plt.cm.BuPu, edgecolor='k')
ax.set_xlabel(features[0])
ax.set_ylabel(features[1])
ax.set_zlabel('Partial dependence')
# set a nicer initial viewing angle
ax.view_init(elev=22, azim=122)
plt.colorbar(surf)
plt.suptitle('PD, house value on median\n'
             'age and avg occupancy, with Gradient Boosting')
plt.subplots_adjust(top=0.9)
ICE plots can be built from the plot_partial_dependence function by using kind='individual'.
ICE plots show the dependence between a target function and an input feature.
Unlike a PDP, which shows the average effect of the input feature, an ICE plot visualizes the dependence of the prediction on a feature for each sample separately - with one line per sample.
Due to the limits of human perception, only one input feature of interest is supported for ICE plots.
While the PDPs are good at showing the average effect of the target features, they can obscure a heterogeneous relationship created by interactions.
ICE plots will provide many more insights if interactions exist. For example, we see a linear relationship between median income and house price in the PD line. The ICE lines show that there are exceptions, where the house price remains constant in some ranges of the median income.
It might not be easy to see the average effect of the input feature in an ICE plot. Consider using ICE plots alongside PDPs; they can be plotted together with kind='both'.
from sklearn.datasets import make_hastie_10_2
from sklearn.ensemble import GradientBoostingClassifier
from sklearn.inspection import plot_partial_dependence as PPD

X, y = make_hastie_10_2(random_state=0)
clf = GradientBoostingClassifier(n_estimators=100, learning_rate=1.0,
                                 max_depth=1, random_state=0).fit(X, y)
features = [0, 1]
PPD(clf, X, features, kind='individual')
PPD(clf, X, features, kind='both')
<sklearn.inspection._plot.partial_dependence.PartialDependenceDisplay at 0x7f875a87d8b0>
import pandas as pd
from sklearn.datasets import fetch_california_housing
from sklearn.model_selection import train_test_split as TTS
cal_housing = fetch_california_housing()
X = pd.DataFrame(cal_housing.data, columns=cal_housing.feature_names)
y = cal_housing.target

# Center the target to avoid a gradient boosting init bias: gradient
# boosting with the 'recursion' method does not account for the initial
# estimator (here, the average target by default).
y -= y.mean()

X_train, X_test, y_train, y_test = TTS(X, y, test_size=0.1, random_state=0)
# 1-way PD using a multilayer perceptron (MLP)
# and gradient boosting
from time import time
from sklearn.pipeline import make_pipeline
from sklearn.preprocessing import QuantileTransformer as QT
from sklearn.neural_network import MLPRegressor as MLPR
print("Training MLPRegressor...")
tic = time()
est = make_pipeline(QT(),
                    MLPR(hidden_layer_sizes=(50, 50),
                         learning_rate_init=0.01,
                         early_stopping=True)).fit(X_train, y_train)
print(f"done in {time() - tic:.3f}s")
print(f"Test R2 score: {est.score(X_test, y_test):.2f}")
Training MLPRegressor...
done in 5.251s
Test R2 score: 0.80
import matplotlib.pyplot as plt
from sklearn.inspection import partial_dependence as PD
from sklearn.inspection import plot_partial_dependence as PPD
tic = time()
features = ['MedInc', 'AveOccup', 'HouseAge', 'AveRooms']
display = PPD(
    est, X_train, features,
    kind="both", subsample=50,
    n_jobs=3, grid_resolution=20, random_state=0)
print(f"done in {time() - tic:.3f}s")
display.figure_.suptitle(
    'PD of house value on non-location features\n'
    'Cal Housing, with MLPRegressor'
)
display.figure_.subplots_adjust(hspace=0.3)
done in 3.154s
from sklearn.experimental import enable_hist_gradient_boosting # noqa
from sklearn.ensemble import HistGradientBoostingRegressor as HGBR
tic = time()
est = HGBR().fit(X_train, y_train)
print(f"done in {time() - tic:.3f}s")
print(f"Test R2 score: {est.score(X_test, y_test):.2f}")
done in 0.565s
Test R2 score: 0.85
tic = time()
display = PPD(
    est, X_train, features, kind="both", subsample=50,
    n_jobs=3, grid_resolution=20, random_state=0
)
print(f"done in {time() - tic:.3f}s")
display.figure_.suptitle(
    'PD of house value on non-location features\n'
    'Cal Housing, with Gradient Boosting'
)
display.figure_.subplots_adjust(wspace=0.4, hspace=0.3)
done in 2.210s
The PDPs (thick blue line) indicate that the median house price: 1) has a linear relationship with median income (top left); 2) drops when the average occupants per household increases (top middle); 3) is not strongly influenced by the house age in a district (top right); 4) nor by the average number of rooms per household (second row).
The ICE curves (light blue lines) complement the analysis: we can see some exceptions, where the house price remains constant over certain ranges of median income and average occupancy.
While house age (top right) does not have a strong average influence on the median house price, there seem to be exceptions where the house price increases for ages between 15 and 25.
Similar exceptions can be observed for the average number of rooms (bottom left). ICE plots therefore reveal some individual effects that are attenuated by taking the average.
In all plots, the tick marks on the x-axis represent the deciles of the feature values in the training data.
MLPRegressor has much smoother predictions than HistGradientBoostingRegressor.
If the features of interest are correlated with the complement features, marginalizing over the complement features creates potentially meaningless synthetic samples.
The partial dependence of a response $f$ at a point $x_S$ is defined as

$\begin{split}pd_{X_S}(x_S) &\overset{def}{=} \mathbb{E}_{X_C}\left[ f(x_S, X_C) \right]\\
&= \int f(x_S, x_C) \, p(x_C) \, dx_C,\end{split}$

where $x_S$ are the input features of interest (the features parameter), $X_C$ are the complement features, and $f(x_S, x_C)$ is the response function (the model's predictions).
Evaluating this expectation over a grid of values of $x_S$ produces the PD curve. An ICE line is a single $f(x_S, x_C^{(i)})$, evaluated over the same grid of $x_S$ for one fixed sample $i$.
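To connect the formula to the plots above, here is a minimal brute-force sketch (not the scikit-learn implementation): each training row keeps its own complement values $x_C^{(i)}$ while the feature of interest is set to a grid value, yielding one ICE line per sample; the PD curve is simply their mean. It assumes the fitted estimator est and the DataFrame X_train from this example.

import numpy as np

def ice_and_pd(model, X, feature, grid):
    # One ICE line per sample: f(x_S, x_C^(i)) evaluated over the grid of x_S.
    ice = np.empty((len(grid), X.shape[0]))
    for j, value in enumerate(grid):
        X_synth = X.copy()
        X_synth[feature] = value  # override the feature of interest only
        ice[j] = model.predict(X_synth)
    # The PD curve is the empirical average of the ICE lines over the samples.
    return ice, ice.mean(axis=1)

grid = np.linspace(X_train['MedInc'].min(), X_train['MedInc'].max(), 20)
ice_lines, pd_curve = ice_and_pd(est, X_train, 'MedInc', grid)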
The method parameter controls how the partial dependence is computed: 'brute' re-predicts on modified copies of the data and works with any fitted estimator (and is required for ICE), while 'recursion' is a faster tree traversal available only for some tree-based estimators and only for the averaged partial dependence; 'auto' (the default) picks 'recursion' when it is supported and 'brute' otherwise.
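As an illustration (the parameter values here are assumptions for this example, not defaults), both strategies can be requested explicitly on the fitted HistGradientBoostingRegressor est:

pd_brute = PD(est, X_train, ['MedInc'], kind='average',
              method='brute', grid_resolution=20)
pd_recursion = PD(est, X_train, ['MedInc'], kind='average',
                  method='recursion', grid_resolution=20)
# Both return the averaged partial dependence on the same grid; 'recursion'
# is faster for supported tree ensembles, 'brute' works with any estimator.
print(pd_brute['average'].shape, pd_recursion['average'].shape)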