L1 and L2 Regularization

author: daodeiv (David Stankov) daodavid

Polynomial Regression, Bias and Variance

Polynomial Regression is a supervised regression algorithm in which the relationship between the feature vector $X$ and the target $Y$ is modeled as an $n^{th}$-degree polynomial function.
We will use a data set prepared in advance from a $3^{rd}$-degree polynomial:

$$y_i = f(x_i) = \theta_3 x_i^3 + \theta_2 x_i^2 + \theta_1 x_i + \theta_0 + \varepsilon_i $$
$$ \; \; \; = 0.2x_i^3 - 2x_i^2 + x_i + \varepsilon_i $$
The noise term $\varepsilon$ is Gaussian distributed with mean zero and some variance $\sigma^2$:

$$\varepsilon \sim N(0,\sigma^2) $$

Now we will use the already prepared data and try to find the best-fitting polynomial with a regression model.
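
Below is a minimal sketch of that setup, assuming we generate the data ourselves from the cubic above (the sample size, $x$-range, and noise level are illustrative assumptions, not the exact values of the original data set) and fit a plain straight line as a baseline:

```python
# Generate noisy samples from f(x) = 0.2x^3 - 2x^2 + x and fit a straight line.
# All constants below (sample size, range, noise scale) are illustrative assumptions.
import numpy as np
from sklearn.linear_model import LinearRegression

rng = np.random.RandomState(42)
x = np.sort(rng.uniform(-3, 10, size=30))
y = 0.2 * x**3 - 2 * x**2 + x + rng.normal(0, 3, size=x.shape)  # f(x) + Gaussian noise

X = x.reshape(-1, 1)                       # sklearn expects a 2-D feature matrix
line = LinearRegression().fit(X, y)
print("R^2 of the straight-line fit:", line.score(X, y))   # low -> the line underfits
```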

As we can see above, using a straight line we've achieved roughly 16% accuracy, which is very poor. When the model is too simple to fit the data, we say the model is underfitting. Simple linear regression is not able to capture the points well; this is called high bias. A model with high bias pays very little attention to the training data and oversimplifies the problem, which always leads to high error on both the training and the test data. We can improve the model by increasing the degree of the polynomial, i.e. by adding new features that are powers of the original one.

$$X = \begin{bmatrix} x_1 \\ \vdots \\ x_n \end{bmatrix} \rightarrow X_{polyData} = T(X) = \begin{bmatrix} 1 & x_1 & x_1^2 & \dots & x_1^p \\ \vdots & \vdots & \vdots & \ddots & \vdots \\ 1 & x_n & x_n^2 & \dots & x_n^p \end{bmatrix} $$

Thus we can extend the model from $Y = \omega_0 + \omega_1x$ to $Y = \omega_0 + \omega_1 x^1 + \dots + \omega_p x^p$, but the problem remains linear, because $Y$ is still a linear combination of the features $x^j$. That means we can again use LinearRegression(). We will transform the data into a $39^{th}$-degree polynomial.
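
A sketch of that transformation, assuming the `X`, `y` arrays from the snippet above:

```python
# Expand X into polynomial features 1, x, x^2, ..., x^39 and refit LinearRegression.
# Such a high degree is numerically ill-conditioned; it is used here only to
# illustrate overfitting.
from sklearn.preprocessing import PolynomialFeatures
from sklearn.linear_model import LinearRegression

poly = PolynomialFeatures(degree=39)
X_poly39 = poly.fit_transform(X)

model = LinearRegression().fit(X_poly39, y)
print("train R^2 of the 39th-degree fit:", model.score(X_poly39, y))  # close to 1
```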

We can see that the accuracy of the $39^{th}$-degree polynomial is 99.9%. This model cannot be right, because the data set contains noise. When a model fits the noise itself, we say it is overfitting, or that it has high variance. On new, unseen data such a model will perform badly.

There are quite a number of techniques that help us prevent overfitting; regularization is one of them. Regularization penalizes large weights, and in the L1 case it also performs feature selection, which helps avoid over-fitting.

Lasso Regression (L1 Regularization)

This is a regularization technique used for feature selection via a shrinkage method, also referred to as penalized regression. Lasso is short for Least Absolute Shrinkage and Selection Operator, and it is used both for regularization and for model selection. If a model uses the L1 penalty, it is called lasso regression. Lasso achieves regularization by completely diminishing the importance given to some features (driving their weights to zero).

The loss function of the Lasso is the ordinary least squares objective with a constraint:

$$J(\varTheta) = \frac{1}{2n}\sum_{i=1}^{n}\Big( y_i - \sum_{j=1}^{m} x_{ij}\theta_j \Big)^2 $$ $$\text{subject to} \hspace{1cm} \sum_{j=1}^{m}|\theta_j| \le t $$ Using a Lagrange multiplier (a smaller budget $t$ corresponds to a larger multiplier $\lambda$), the solution of the above problem is obtained by minimizing:

$$\text{Lasso loss} = J(\varTheta) = \frac{1}{2n}\sum_{i=1}^{n}\Big( y_i - \sum_{j=1}^{m} x_{ij}\theta_j \Big)^2 + \lambda \sum_{j=1}^{m}|\theta_j|$$

The term $\lambda \sum_{j=1}^{m}|\theta_j|$ represents the penalty.
The tuning parameter $\lambda$ controls the strength of the L1 penalty: it is essentially the amount of shrinkage.

Let's investigate how the lasso performs; we will use Lasso from sklearn.
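
A minimal sketch of that step, assuming the `X`, `y` arrays from earlier. Note that sklearn discourages `Lasso(alpha=0)` (it is then just ordinary least squares), so a tiny alpha is used instead; the scaling step is an assumption that keeps the penalty comparable across the polynomial powers:

```python
# 12th-degree polynomial features fed into sklearn's Lasso with a near-zero penalty.
from sklearn.pipeline import make_pipeline
from sklearn.preprocessing import PolynomialFeatures, StandardScaler
from sklearn.linear_model import Lasso

lasso_pipe = make_pipeline(
    PolynomialFeatures(degree=12, include_bias=False),
    StandardScaler(),                      # assumed: put all powers on the same scale
    Lasso(alpha=1e-6, max_iter=100_000),   # alpha ~ 0, i.e. (almost) no regularization
)
lasso_pipe.fit(X, y)
print("train R^2:", lasso_pipe.score(X, y))
```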

Above we've used a $12^{th}$-degree polynomial and a Lasso with alpha close to zero. We will now train the lasso with different tuning parameters $\lambda = [10^{-4},10^{-3},10^{-2},10^{-1},1]$ in order to see their impact on the model.
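
A sketch of that experiment: refit the Lasso for each value and record the learned weights, which can then be plotted against $\lambda$ (again assuming the `X`, `y` arrays from earlier):

```python
# Coefficient paths: one row of coef_paths per alpha, one column per polynomial feature.
import numpy as np
from sklearn.preprocessing import PolynomialFeatures, StandardScaler
from sklearn.linear_model import Lasso

X_poly = PolynomialFeatures(degree=12, include_bias=False).fit_transform(X)
X_scaled = StandardScaler().fit_transform(X_poly)

alphas = [1e-4, 1e-3, 1e-2, 1e-1, 1]
coef_paths = np.array([
    Lasso(alpha=a, max_iter=100_000).fit(X_scaled, y).coef_ for a in alphas
])
print(coef_paths.shape)   # (n_alphas, n_features); plot each column versus alpha
```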

From the graphic above we can see that as $\lambda$ increases, the weights (predictors) $w_i$ move toward zero. Another important point is that the rate at which a weight decreases is related to its size, roughly $\frac{\partial w_i}{\partial \lambda} \propto w_i$.

Let's see what happens with larger values, $\lambda = [1, 10, 20, 30, 100]$.

From the graph above we see that with a large enough $\lambda$ the weights become exactly zero. Because of this, we can use the Lasso for feature selection.

The lasso performs shrinkage so that there are "corners" in the constraint region, which in two dimensions corresponds to a diamond. If the sum of squares "hits" one of these corners, then the coefficient corresponding to the axis is shrunk to zero.


Lasso for feature selection

We've seen that the regularization process is controlled by the alpha parameter of the Lasso model: with higher alpha, some weights become zero. Once we've found an alpha for which the model works well, we can drop the features whose weights are zero. In this way we perform feature selection.

Let's try to find the best alpha
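
One way to sketch that search is with a simple train/test split (the split size and the alpha grid are assumptions):

```python
# Score a 12th-degree Lasso pipeline on train and test data for a grid of alphas.
from sklearn.model_selection import train_test_split
from sklearn.pipeline import make_pipeline
from sklearn.preprocessing import PolynomialFeatures, StandardScaler
from sklearn.linear_model import Lasso

X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.25, random_state=0)

for alpha in [1e-4, 1e-3, 1e-2, 1e-1, 1, 10]:
    pipe = make_pipeline(
        PolynomialFeatures(degree=12, include_bias=False),
        StandardScaler(),
        Lasso(alpha=alpha, max_iter=100_000),
    )
    pipe.fit(X_train, y_train)
    print(f"alpha={alpha:g}  train R^2={pipe.score(X_train, y_train):.3f}"
          f"  test R^2={pipe.score(X_test, y_test):.3f}")
```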

For $\alpha$ higher than $0.1$, both train and test accuracy start to decrease. Therefore, from the graph we can pick $0.1$ as the best $\alpha$, for which the model achieves a score of about $0.94$ on the test data.

For the model's predictors (weights) we have:
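
A sketch of inspecting the weights at the chosen alpha (the value $0.1$ follows the discussion above; `X_scaled` and `y` are from the earlier snippets):

```python
# Fit the Lasso at alpha=0.1 and list which weights survived.
import numpy as np
from sklearn.linear_model import Lasso

best_lasso = Lasso(alpha=0.1, max_iter=100_000).fit(X_scaled, y)
print("weights:", np.round(best_lasso.coef_, 4))
print("indices of non-zero weights:", np.flatnonzero(best_lasso.coef_))
```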

We can perform feature selection by keeping only the columns (features) with non-zero weights and creating a new data set.

Let's train a new LinearRegression model using only the features selected by the Lasso.
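
A sketch of that refit, assuming `X_scaled`, `y`, and `best_lasso` from the previous snippets:

```python
# Keep only the columns whose Lasso weight is non-zero, then refit plain OLS on them.
import numpy as np
from sklearn.linear_model import LinearRegression

selected = np.flatnonzero(best_lasso.coef_)        # indices of surviving features
X_selected = X_scaled[:, selected]                 # reduced design matrix
print("shape before/after selection:", X_scaled.shape, X_selected.shape)

lin = LinearRegression().fit(X_selected, y)
print("R^2 on the reduced feature set:", lin.score(X_selected, y))
```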

We've achieved the same result, although the dimensionality of the data is reduced from the original (30, 13) design matrix to one containing only the columns with non-zero weights.

Ridge regression (L2 regularization)

Ridge regression, like the Lasso, is a form of regularized regression. Both methods seek to alleviate the consequences of multicollinearity, poorly conditioned equations, and overfitting.

Ridge regression, like the Lasso, is motivated by a constrained minimization problem: its loss function is the ordinary least squares objective, this time with a constraint on the squared weights.

$$J(\varTheta) = \frac{1}{2n}\sum_{i=1}^{n}\Big( y_i - \sum_{j=1}^{m} x_{ij}\theta_j \Big)^2 $$ $$\text{subject to} \hspace{1cm} \sum_{j=1}^{m}\theta_j^2 \le t $$

Using a Lagrange multiplier we can rewrite the problem as: $$\text{Ridge loss} = J(\varTheta) = \frac{1}{2n}\sum_{i=1}^{n}\Big( y_i - \sum_{j=1}^{m} x_{ij}\theta_j \Big)^2 + \lambda \sum_{j=1}^{m}\theta_j^2$$

Ridge regression decreases the complexity of a model but does not reduce the number of variables, since it never drives a coefficient to exactly zero; it only shrinks it. Hence, this model is not suitable for feature reduction.

Considering the geometry of both the lasso (left) and ridge (right) models, the elliptical contours (red circles) are the cost functions for each. Relaxing the constraints introduced by the penalty factor leads to an increase in the constrained region (diamond, circle). Doing this continually, we will hit the center of the ellipse, where the results of both lasso and ridge models are similar to a linear regression model.

However, both methods determine coefficients by finding the first point where the elliptical contours hit the region of constraints. Since lasso regression takes a diamond shape in the plot for the constrained region, each time the elliptical regions intersect with these corners, at least one of the coefficients becomes zero. This is impossible in the ridge regression model as it forms a circular shape and therefore values can be shrunk close to zero, but never equal to zero.
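
A small sketch contrasting the two penalties on the same design matrix (assuming `X_scaled` and `y` from earlier): the Lasso drives some weights exactly to zero, while Ridge only shrinks them.

```python
# Count exactly-zero coefficients under L1 (Lasso) and L2 (Ridge) penalties.
import numpy as np
from sklearn.linear_model import Lasso, Ridge

lasso = Lasso(alpha=0.1, max_iter=100_000).fit(X_scaled, y)
ridge = Ridge(alpha=0.1).fit(X_scaled, y)

print("lasso zero weights:", np.sum(lasso.coef_ == 0))
print("ridge zero weights:", np.sum(ridge.coef_ == 0))   # typically 0: shrunk, not removed
```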

K-fold cross validation

Cross-validation is a resampling method that uses different portions of the data to test and train a model on different iterations. The goal of cross-validation is to test the model's ability to predict new data that was not used in estimating it, in order to flag problems like overfitting.

In k-fold cross-validation, the original sample is randomly partitioned into k equal-sized subsamples. Of the k subsamples, a single subsample is retained as the validation data for testing the model, and the remaining k − 1 subsamples are used as training data. The cross-validation process is then repeated k times, with each of the k subsamples used exactly once as the validation data. The k results can then be averaged to produce a single estimate. The advantage of this method over repeated random sub-sampling is that all observations are used for both training and validation, and each observation is used for validation exactly once. 10-fold cross-validation is commonly used, but in general k remains an unfixed parameter.

Let's implement k-fold cross-validation.
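
A sketch using sklearn's `KFold` and `cross_val_score` over the same alpha grid (the fold count and the grid are assumptions); the mean score per alpha is what the graph refers to:

```python
# 5-fold cross-validation of the 12th-degree Lasso pipeline for several alphas.
from sklearn.model_selection import KFold, cross_val_score
from sklearn.pipeline import make_pipeline
from sklearn.preprocessing import PolynomialFeatures, StandardScaler
from sklearn.linear_model import Lasso

kfold = KFold(n_splits=5, shuffle=True, random_state=0)
for alpha in [1e-3, 1e-2, 1e-1, 1, 10]:
    pipe = make_pipeline(
        PolynomialFeatures(degree=12, include_bias=False),
        StandardScaler(),
        Lasso(alpha=alpha, max_iter=100_000),
    )
    scores = cross_val_score(pipe, X, y, cv=kfold, scoring="r2")
    print(f"alpha={alpha:g}  mean CV R^2={scores.mean():.3f} +/- {scores.std():.3f}")
```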

From the graph we can see that at $\alpha = 0.1$ the model achieves the best accuracy.
