import matplotlib.pyplot as plt
import numpy as np
import numpy.random as rnd

# Ground-truth model: p covariates plus an intercept, observed with Gaussian
# noise of standard deviation sig.
p, sig = 1, 0.2

# True coefficients (intercept first), drawn once from N(0, 1).
beta = rnd.normal(loc=0, scale=1, size=p + 1)

beta

array([-0.63770377, -1.0142289 ])

# Training covariates: n draws from a centred Gaussian with standard deviation 10.
n = 50
x = rnd.normal(loc=0, scale=10, size=(n, p))

# Prepend a column of ones so that beta[0] plays the role of the intercept.
ones_col = np.ones((n, 1))
X = np.hstack((ones_col, x))
X.shape

(50, 2)

# Responses: arctan of the linear predictor plus N(0, sig^2) noise.
Y = np.arctan(np.dot(X, beta)) + rnd.normal(loc=0, scale=sig, size=n)

# Noise-free regression function evaluated on a regular grid spanning the
# observed covariates (plotted under the label 'predict Bayes').
n0 = 100
x_lo, x_hi = x.min(), x.max()
x_plot = np.linspace(x_lo, x_hi, n0)
pred_bayes = np.arctan(beta[0] + x_plot * beta[1])

# Scatter of the sample against the noise-free curve.
plt.plot(x, Y, 'o', label='data')
plt.plot(x_plot, pred_bayes, label='predict Bayes')
plt.legend()
plt.show()

from sklearn.kernel_ridge import KernelRidge

# Kernel ridge regressor with an RBF kernel; alpha is the ridge penalty and
# gamma the kernel parameter.
krr_settings = {'alpha': 0.06, 'kernel': 'rbf', 'gamma': 0.01}
model = KernelRidge(**krr_settings)

# Fit on the raw covariates x (not on the intercept-augmented matrix X).
model.fit(x, Y)

KernelRidge(alpha=0.06, gamma=0.01, kernel='rbf')

KernelRidge(alpha=0.06, gamma=0.01, kernel='rbf')

# Predict on the plotting grid; the grid is 1-D, so it is passed to the
# estimator as a single column.
pred = model.predict(x_plot[:, np.newaxis])

# Sample, noise-free curve and fitted curve on the same axes.
plt.plot(x, Y, 'o', label='data')
plt.plot(x_plot, pred_bayes, label='pred Bayes')
plt.plot(x_plot, pred, label='predictions')
plt.legend()
plt.show()

from sklearn.metrics import mean_squared_error as MSE

# Monte Carlo estimate of the generalisation risk of the fitted model: draw a
# large fresh sample from the same data-generating process and score the
# model's predictions on it.
n_estim = 20000
x_new = rnd.normal(0, 10, size=(n_estim, p))
X_new = np.hstack((np.ones((n_estim, 1)), x_new))
Y_new = np.arctan(np.dot(X_new, beta)) + rnd.normal(0, sig, size=n_estim)
Y_pred = model.predict(x_new.reshape(n_estim, 1))

MSE(Y_new, Y_pred)

0.10814719322695762

# Monte Carlo estimate of the mean risk: the generalisation risk averaged over
# m_estim independent training samples of size n.
m_estim = 20
n_estim = 2000
mse = 0.

for _ in range(m_estim):
    # Fresh training sample, same size n as the sample used for the single-fit
    # risk estimate, so both quantities describe the same learning problem.
    x_train = rnd.normal(0, 10, (n, p))
    X_train = np.concatenate((np.ones((n, 1)), x_train), axis=1)
    Y_train = np.arctan(X_train.dot(beta)) + rnd.normal(0, sig, n)
    model = KernelRidge(alpha=0.06, kernel='rbf', gamma=0.01)
    model.fit(x_train, Y_train)

    # Independent test sample. Scoring on the points used for fitting would
    # measure the training error, not the risk.
    x_new = rnd.normal(0, 10, (n_estim, p))
    X_new = np.concatenate((np.ones((n_estim, 1)), x_new), axis=1)
    Y_new = np.arctan(X_new.dot(beta)) + rnd.normal(0, sig, n_estim)
    Y_pred = model.predict(x_new)
    mse += MSE(Y_new, Y_pred)

mse/m_estim

0.05581331855816599

# Effect of the ridge penalty: for each alpha on a grid, fit on the training
# sample (x, Y), estimate the generalisation risk by Monte Carlo, and keep the
# alpha with the smallest estimate.
n_estim = 20000
risque_alpha = []
range_alpha = np.arange(0.0001, 0.2, 0.005)

# One test sample shared by every alpha: all candidates are scored on the same
# points, so differences along the curve come from alpha rather than from
# independent Monte Carlo noise, and the sample is generated only once.
x_new = rnd.normal(0, 10, (n_estim, p))
X_new = np.concatenate((np.ones((n_estim, 1)), x_new), axis=1)
Y_new = np.arctan(X_new.dot(beta)) + rnd.normal(0, sig, n_estim)

for alpha in range_alpha:
    model = KernelRidge(alpha=alpha, kernel='rbf', gamma=0.01)
    model.fit(x, Y)
    Y_pred = model.predict(x_new)
    risque_alpha.append(MSE(Y_new, Y_pred))

# Grid value with the smallest estimated risk.
alpha_opt = range_alpha[np.argmin(risque_alpha)]
alpha_opt

0.0051

# Smallest estimated risk over the alpha grid.
best_idx = np.argmin(risque_alpha)
risque_alpha[best_idx]

0.0963244389375491

# Estimated risk as a function of the ridge penalty alpha.
risk_axes = plt.gca()
risk_axes.plot(range_alpha, risque_alpha)
plt.show()

# Refit on the same training sample with three ridge penalties -- a near-zero
# one, a large one, and the grid value with the smallest estimated risk -- and
# plot each fit against the noise-free regression function.

# The plotting grid and the noise-free curve do not depend on the penalty.
x_plot = np.linspace(x.min(), x.max(), 100)
pred_bayes = np.arctan(beta[0] + beta[1]*x_plot)

for penalty in (0.0000001, 2, alpha_opt):
    model = KernelRidge(alpha=penalty, kernel='rbf', gamma=0.01)
    model.fit(x, Y)
    pred = model.predict(x_plot.reshape((-1, 1)))

    plt.plot(x, Y, 'o', label='data', alpha=0.2)
    plt.plot(x_plot, pred_bayes, label='pred Bayes')
    plt.plot(x_plot, pred, label='predictions')
    plt.legend()
    plt.show()

# Draw a larger training sample (n = 150) from the same data-generating
# process and refit with alpha=0.06, gamma=0.01.
n = 150
x = rnd.normal(0, 10, size=(n, p))
X = np.hstack((np.ones((n, 1)), x))
Y = np.arctan(np.dot(X, beta)) + rnd.normal(0, sig, size=n)

model = KernelRidge(kernel='rbf', alpha=0.06, gamma=0.01)
model.fit(x, Y)

# Fitted curve and noise-free curve on a grid spanning the new covariates.
x_plot = np.linspace(x.min(), x.max(), 100)
pred_bayes = np.arctan(beta[0] + beta[1]*x_plot)
pred = model.predict(x_plot[:, np.newaxis])

plt.plot(x, Y, 'o', label='data', alpha=0.2)
plt.plot(x_plot, pred_bayes, label='pred Bayes')
plt.plot(x_plot, pred, label='predictions')
plt.legend()
plt.show()

# Monte Carlo estimate of the generalisation risk of the current model, using
# a fresh sample of size n_estim from the same data-generating process.
n_estim = 20000
x_new = rnd.normal(0, 10, size=(n_estim, p))
intercept_new = np.ones((n_estim, 1))
X_new = np.hstack((intercept_new, x_new))
Y_new = np.arctan(np.dot(X_new, beta)) + rnd.normal(0, sig, size=n_estim)
Y_pred = model.predict(x_new.reshape(n_estim, 1))

MSE(Y_new, Y_pred)

0.07029323368331582

from sklearn.model_selection import cross_val_score

# 5-fold cross-validated MSE on the training sample. The scorer returns the
# negated MSE, hence the sign flip on the average below.
model = KernelRidge(kernel='rbf', alpha=0.06, gamma=0.01)
scores = cross_val_score(
    model, x, Y,
    scoring='neg_mean_squared_error',
    cv=5,
)

-scores.mean()

0.08580735407908234

from sklearn.model_selection import GridSearchCV

# Joint search over the ridge penalty (alpha) and the RBF kernel parameter
# (gamma); both are scanned over the same grid of values.
hyper_grid = np.arange(0.0001, 0.2, 0.005)
parameters = {'alpha': hyper_grid, 'gamma': hyper_grid}

# Each combination is scored by 3-fold cross-validated (negated) MSE.
kr = KernelRidge(kernel='rbf')
model = GridSearchCV(
    kr,
    parameters,
    scoring='neg_mean_squared_error',
    cv=3,
)

model.fit(x, Y)

GridSearchCV(cv=3, estimator=KernelRidge(kernel='rbf'),
             param_grid={'alpha': array([1.000e-04, 5.100e-03, 1.010e-02, 1.510e-02, 2.010e-02, 2.510e-02,
       3.010e-02, 3.510e-02, 4.010e-02, 4.510e-02, 5.010e-02, 5.510e-02,
       6.010e-02, 6.510e-02, 7.010e-02, 7.510e-02, 8.010e-02, 8.510e-02,
       9.010e-02, 9.510e-02, 1.001e-01, 1.051e-01, 1.101e-01, 1.151e-01,
       1.201e-01, 1.251e-01, 1.301e-01...
       3.010e-02, 3.510e-02, 4.010e-02, 4.510e-02, 5.010e-02, 5.510e-02,
       6.010e-02, 6.510e-02, 7.010e-02, 7.510e-02, 8.010e-02, 8.510e-02,
       9.010e-02, 9.510e-02, 1.001e-01, 1.051e-01, 1.101e-01, 1.151e-01,
       1.201e-01, 1.251e-01, 1.301e-01, 1.351e-01, 1.401e-01, 1.451e-01,
       1.501e-01, 1.551e-01, 1.601e-01, 1.651e-01, 1.701e-01, 1.751e-01,
       1.801e-01, 1.851e-01, 1.901e-01, 1.951e-01])},
             scoring='neg_mean_squared_error')

GridSearchCV(cv=3, estimator=KernelRidge(kernel='rbf'),
             param_grid={'alpha': array([1.000e-04, 5.100e-03, 1.010e-02, 1.510e-02, 2.010e-02, 2.510e-02,
       3.010e-02, 3.510e-02, 4.010e-02, 4.510e-02, 5.010e-02, 5.510e-02,
       6.010e-02, 6.510e-02, 7.010e-02, 7.510e-02, 8.010e-02, 8.510e-02,
       9.010e-02, 9.510e-02, 1.001e-01, 1.051e-01, 1.101e-01, 1.151e-01,
       1.201e-01, 1.251e-01, 1.301e-01...
       3.010e-02, 3.510e-02, 4.010e-02, 4.510e-02, 5.010e-02, 5.510e-02,
       6.010e-02, 6.510e-02, 7.010e-02, 7.510e-02, 8.010e-02, 8.510e-02,
       9.010e-02, 9.510e-02, 1.001e-01, 1.051e-01, 1.101e-01, 1.151e-01,
       1.201e-01, 1.251e-01, 1.301e-01, 1.351e-01, 1.401e-01, 1.451e-01,
       1.501e-01, 1.551e-01, 1.601e-01, 1.651e-01, 1.701e-01, 1.751e-01,
       1.801e-01, 1.851e-01, 1.901e-01, 1.951e-01])},
             scoring='neg_mean_squared_error')

KernelRidge(alpha=0.10010000000000001, gamma=0.0101, kernel='rbf')

KernelRidge(alpha=0.10010000000000001, gamma=0.0101, kernel='rbf')

# Hyperparameter combination selected by the grid search.
model.best_params_

{'alpha': 0.10010000000000001, 'gamma': 0.0101}

# Predictions of the tuned model on a regular grid over the observed
# covariates, shown next to the noise-free regression function.
x_plot = np.linspace(x.min(), x.max(), 100)
pred_bayes = np.arctan(beta[0] + beta[1]*x_plot)
pred = model.predict(x_plot[:, np.newaxis])

plt.plot(x, Y, 'o', label='data', alpha=0.2)
plt.plot(x_plot, pred_bayes, label='pred Bayes')
plt.plot(x_plot, pred, label='predictions')
plt.legend()
plt.show()

# Residuals of the model on the sample (x, Y).
err = Y - model.predict(x)

from scipy.stats import norm, normaltest

# Test the residuals for departure from normality.
normaltest(err)

NormaltestResult(statistic=2.5079239158887283, pvalue=0.28537192258619043)

# Gaussian fit to the residuals: estimated (mean, standard deviation).
norm.fit(err)

(-0.00042547455007194184, 0.2709213153648689)

# Location and scale of the Gaussian fitted to the residuals.
m_err, sig_err = norm.fit(err)

# Quantile of the N(0, 1) distribution for a two-sided 95% band.
q = norm.ppf(1 - 0.05 / 2)

# Band of half-width sig_err * q around the predictions.
# NOTE(review): the band is centred on pred; m_err is not used.
half_width = sig_err * q
band_low, band_high = pred - half_width, pred + half_width

plt.plot(x, Y, 'o', label='data', alpha=0.2)
plt.plot(x_plot, pred_bayes, label='pred Bayes')
plt.plot(x_plot, pred, label='predictions')
plt.fill_between(x_plot, band_low, band_high, color="g", alpha=0.1, label='IC 95%')
plt.legend()
plt.show()

Évaluation numérique du risque : illustrations

Définition de la loi jointe et estimation du risque de Bayes

Définition de la classe de modèles utilisée pour la régression

Minimiseur du risque empirique

Risque de généralisation et risque moyen

Effet du paramètre de régularisation

Validation croisée (cross-validation)

Recherche des hyperparamètres