#!/usr/bin/env python
# coding: utf-8

# ### Week 2: Demo Bias Variance Tradeoff
#
# The demo covers the change in the bias and variance contributions to the
# MSE when the model complexity increases/decreases through either
# regularization or dimension reduction.

# In[13]:

import numpy as np
import matplotlib.pyplot as plt

# Generating noisy samples from a degree 3 polynomial
xtrain = np.linspace(-1, 1, 10)
xtest = np.linspace(-1, 1, 50)

t = xtrain**3 + xtrain**2 + 2*xtrain + 1
t_test = xtest**3 + xtest**2 + 2*xtest + 1

tnoisy = t.reshape(-1, 1) + np.random.normal(0, .4, len(xtrain)).reshape(-1, 1)

plt.scatter(xtrain, tnoisy, c='r')
plt.plot(xtest, t_test)
plt.show()

# In[15]:

# For each of 100 experiments, we generate a different set of noisy
# samples (x_i, t_i) and learn a degree 7 polynomial through a ridge
# formulation with a very mild level of regularization.

numXp = 100

from sklearn.preprocessing import PolynomialFeatures

numfeatures = 7
poly = PolynomialFeatures(numfeatures)
full_beta = np.zeros((numfeatures + 1, numXp))
lbda = .0001

for i in range(numXp):
    # generating points
    tnoisy = t + np.random.normal(0, .6, len(xtrain))

    # fitting models via the closed-form ridge solution
    # beta = (X^T X + lambda*I)^{-1} X^T t
    Xtilde = poly.fit_transform(xtrain.reshape(-1, 1))
    gram = np.matmul(Xtilde.T, Xtilde)
    tmp_inv = np.linalg.inv(gram + lbda*np.eye(gram.shape[0]))
    beta = np.matmul(tmp_inv, np.matmul(Xtilde.T, tnoisy))
    full_beta[:, i] = beta

# drawing the plot
XtildeTest = poly.fit_transform(xtest.reshape(-1, 1))
plt.scatter(xtrain, tnoisy, c='r', label='Samples')
for i in range(numXp):
    plt.plot(xtest, np.matmul(XtildeTest, full_beta[:, i]), c='b', alpha=.05)
plt.plot(xtest, t_test, c='g', label='True model')
plt.plot(xtest, np.matmul(XtildeTest, np.mean(full_beta, axis=1)), '--', c='r',
         label='Averaged model')
plt.legend()
plt.savefig('biasVariance2.png', dpi=300)
plt.show()

# In[16]:

# In order to study the result of a reduction in the model complexity,
# we start by increasing the level of regularization, setting lambda to 10.

numXp = 100

from sklearn.preprocessing import PolynomialFeatures

numfeatures = 7
poly = PolynomialFeatures(numfeatures)
full_beta = np.zeros((numfeatures + 1, numXp))
lbda = 10

for i in range(numXp):
    # generating points
    tnoisy = t + np.random.normal(0, .6, len(xtrain))

    # fitting models
    Xtilde = poly.fit_transform(xtrain.reshape(-1, 1))
    gram = np.matmul(Xtilde.T, Xtilde)
    tmp_inv = np.linalg.inv(gram + lbda*np.eye(gram.shape[0]))
    beta = np.matmul(tmp_inv, np.matmul(Xtilde.T, tnoisy))
    full_beta[:, i] = beta

# drawing the plot
XtildeTest = poly.fit_transform(xtest.reshape(-1, 1))
plt.scatter(xtrain, tnoisy, c='r', label='Samples')
for i in range(numXp):
    plt.plot(xtest, np.matmul(XtildeTest, full_beta[:, i]), c='b', alpha=.05)
plt.plot(xtest, t_test, c='g', label='True model')
plt.plot(xtest, np.matmul(XtildeTest, np.mean(full_beta, axis=1)), '--', c='r',
         label='Averaged model')
plt.legend()
plt.savefig('biasVariance3.png', dpi=300)
plt.show()
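# To make the tradeoff quantitative, we can estimate the two contributions
# empirically from the ensemble of fitted models: the squared bias is the
# gap between the averaged prediction and the true curve, and the variance
# is the spread of the individual predictions around that average. The
# helper below is a minimal sketch (the name `bias_variance` is ours, not
# part of any library); it reuses `XtildeTest` and `t_test` from the cells
# above and works for any `full_beta` produced by the experiments.

# In[ ]:

def bias_variance(full_beta, XtildeTest, t_test):
    """Empirical bias^2 and variance of the predictions over the test grid."""
    preds = np.matmul(XtildeTest, full_beta)   # (n_test, numXp), one column per XP
    avg_pred = preds.mean(axis=1)              # averaged model over the XPs
    bias2 = np.mean((avg_pred - t_test)**2)    # squared bias, averaged over x
    variance = np.mean(preds.var(axis=1))      # variance across XPs, averaged over x
    return bias2, variance

bias2, variance = bias_variance(full_beta, XtildeTest, t_test)
print('bias^2 = %.4f, variance = %.4f' % (bias2, variance))

# Running this after the mild-regularization cell versus the lambda = 10 cell
# should show the variance shrinking and the squared bias growing as the
# effective complexity is reduced.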
# In[17]:

# Finally, we study the effect on the bias and variance of a reduction in
# the number of features. We repeat the experiments with a simple linear
# model (degree 1), keeping the regularization mild so that the change
# comes from the reduced dimension alone.

numXp = 100

from sklearn.preprocessing import PolynomialFeatures

numfeatures = 1
poly = PolynomialFeatures(numfeatures)
full_beta = np.zeros((numfeatures + 1, numXp))
lbda = .0001

for i in range(numXp):
    # generating points
    tnoisy = t + np.random.normal(0, .6, len(xtrain))

    # fitting models
    Xtilde = poly.fit_transform(xtrain.reshape(-1, 1))
    gram = np.matmul(Xtilde.T, Xtilde)
    tmp_inv = np.linalg.inv(gram + lbda*np.eye(gram.shape[0]))
    beta = np.matmul(tmp_inv, np.matmul(Xtilde.T, tnoisy))
    full_beta[:, i] = beta

# drawing the plot
XtildeTest = poly.fit_transform(xtest.reshape(-1, 1))
plt.scatter(xtrain, tnoisy, c='r', label='Samples')
for i in range(numXp):
    plt.plot(xtest, np.matmul(XtildeTest, full_beta[:, i]), c='b', alpha=.05)
plt.plot(xtest, t_test, c='g', label='True model')
plt.plot(xtest, np.matmul(XtildeTest, np.mean(full_beta, axis=1)), '--', c='r',
         label='Averaged model')
plt.legend()
plt.savefig('biasVariance4.png', dpi=300)
plt.show()
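# As a closing check, we can sweep the regularization level and trace the
# full tradeoff curve: the squared bias should increase and the variance
# decrease as lambda grows, with their sum minimized somewhere in between.
# This is a sketch under the same setup as above (degree 7, 100 experiments
# per lambda); it reuses the `bias_variance` helper defined earlier, and the
# grid of lambda values is an arbitrary choice.

# In[ ]:

numfeatures = 7
poly = PolynomialFeatures(numfeatures)
Xtilde = poly.fit_transform(xtrain.reshape(-1, 1))
XtildeTest = poly.fit_transform(xtest.reshape(-1, 1))

lbdas = np.logspace(-4, 2, 20)
bias2s, variances = [], []
for lbda in lbdas:
    full_beta = np.zeros((numfeatures + 1, numXp))
    for i in range(numXp):
        # fresh noisy samples for each experiment, as in the cells above
        tnoisy = t + np.random.normal(0, .6, len(xtrain))
        gram = np.matmul(Xtilde.T, Xtilde)
        tmp_inv = np.linalg.inv(gram + lbda*np.eye(gram.shape[0]))
        full_beta[:, i] = np.matmul(tmp_inv, np.matmul(Xtilde.T, tnoisy))
    b2, v = bias_variance(full_beta, XtildeTest, t_test)
    bias2s.append(b2)
    variances.append(v)

plt.semilogx(lbdas, bias2s, label='bias^2')
plt.semilogx(lbdas, variances, label='variance')
plt.semilogx(lbdas, np.array(bias2s) + np.array(variances), '--',
             label='bias^2 + variance')
plt.xlabel('lambda')
plt.legend()
plt.show()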