# Method Selector

In [1]:
from sklearn import linear_model, metrics
from sklearn.neighbors import KNeighborsRegressor
from sklearn.preprocessing import PolynomialFeatures, StandardScaler
from sklearn.model_selection import train_test_split, cross_val_score, KFold
from sklearn.linear_model import Lasso, Ridge, LassoCV, RidgeCV, LinearRegression

import numpy as np 
import pandas as pd 
import matplotlib.pyplot as plt
import seaborn as sns

from models import *

%matplotlib inline

In [2]:
# Load the diamonds dataset; the CSV's 'Unnamed: 0' column becomes the row index.
diamonds = pd.read_csv(
    'diamonds.csv',
    index_col='Unnamed: 0',
)

In [3]:
# Load the cleaned life expectancy dataset; the CSV's 'Unnamed: 0' column
# becomes the row index.
life_exp = pd.read_csv(
    'cleaned_life_expectancy.csv',
    index_col='Unnamed: 0',
)

In [4]:
# Evaluation table for the diamond models. Each regression(...) call below that
# is passed diamond_eval adds its metrics row to it (see the recorded outputs).
# NOTE(review): eval_df is presumably provided by `from models import *` and
# returns an empty table with the metric columns -- confirm in models.py.
diamond_eval = eval_df()

In [5]:
# Evaluation table for the life expectancy models. Each regression(...) call
# below that is passed life_exp_eval adds its metrics row to it (see the
# recorded outputs).
# NOTE(review): eval_df is presumably provided by `from models import *` and
# returns an empty table with the metric columns -- confirm in models.py.
life_exp_eval = eval_df()

In [6]:
# Baseline: multivariate linear regression of price on six diamond features.
# The resulting metrics row is recorded in diamond_eval.
regression(
    diamonds,
    ['carat', 'x', 'y', 'z', 'depth', 'table'],
    'price',
    diamond_eval,
    regtype='Multivariate',
)

Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,1486.771,0.859,0.859,0.859,0.859,0.854


In [7]:
# Same features and target as the baseline, with degree-2 polynomial terms.
# In the recorded output the 5-fold CV score turns strongly negative here.
regression(
    diamonds,
    ['carat', 'x', 'y', 'z', 'depth', 'table'],
    'price',
    diamond_eval,
    regtype='Multivariate',
    poly_deg=2,
)

Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,1486.771,0.859,0.859,0.859,0.859,0.854
1,Multivariate Polynomial Regression,2.0,,1886.163,0.876,0.876,0.774,0.773,-42.203


In [8]:
# Degree-3 polynomial variant of the multivariate model on the diamonds data.
# NOTE(review): the recorded 5-fold CV score is extremely negative, which
# looks like severe instability on some folds -- worth investigating.
regression(
    diamonds,
    ['carat', 'x', 'y', 'z', 'depth', 'table'],
    'price',
    diamond_eval,
    regtype='Multivariate',
    poly_deg=3,
)

Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,1486.771,0.859,0.859,0.859,0.859,0.854
1,Multivariate Polynomial Regression,2.0,,1886.163,0.876,0.876,0.774,0.773,-42.203
2,Multivariate Polynomial Regression,3.0,,1909.963,0.883,0.883,0.768,0.768,-452794.283


In [9]:
# Lasso regression on the diamonds features. regression() asks for the
# iteration count at run time (interactive prompt); the alpha shown in the
# results table is not supplied here.
regression(
    diamonds,
    ['carat', 'x', 'y', 'z', 'depth', 'table'],
    'price',
    diamond_eval,
    regtype='Lasso',
)

How many interations? 100000


Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,1486.771,0.859,0.859,0.859,0.859,0.854
1,Multivariate Polynomial Regression,2.0,,1886.163,0.876,0.876,0.774,0.773,-42.203
2,Multivariate Polynomial Regression,3.0,,1909.963,0.883,0.883,0.768,0.768,-452794.283
3,Lasso Linear Regression,1.0,Iterations: 100000 and Alpha: 3.685019951033...,1488.173,0.859,0.859,0.859,0.859,0.859


In [10]:
# Lasso with degree-2 polynomial features on the diamonds data.
# The iteration count is entered at the interactive prompt.
regression(
    diamonds,
    ['carat', 'x', 'y', 'z', 'depth', 'table'],
    'price',
    diamond_eval,
    regtype='Lasso',
    poly_deg=2,
)

How many interations? 100000


Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,1486.771,0.859,0.859,0.859,0.859,0.854
1,Multivariate Polynomial Regression,2.0,,1886.163,0.876,0.876,0.774,0.773,-42.203
2,Multivariate Polynomial Regression,3.0,,1909.963,0.883,0.883,0.768,0.768,-452794.283
3,Lasso Linear Regression,1.0,Iterations: 100000 and Alpha: 3.685019951033...,1488.173,0.859,0.859,0.859,0.859,0.859
4,Lasso Polynomial Regression,2.0,Iterations: 100000 and Alpha: 352.612582868472,1537.234,0.849,0.849,0.85,0.85,-4.154


In [11]:
# Lasso with degree-3 polynomial features on the diamonds data.
# The iteration count is entered at the interactive prompt (the recorded run
# used a larger value than the previous Lasso cells).
regression(
    diamonds,
    ['carat', 'x', 'y', 'z', 'depth', 'table'],
    'price',
    diamond_eval,
    regtype='Lasso',
    poly_deg=3,
)

How many interations? 1000000


Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,1486.771,0.859,0.859,0.859,0.859,0.854
1,Multivariate Polynomial Regression,2.0,,1886.163,0.876,0.876,0.774,0.773,-42.203
2,Multivariate Polynomial Regression,3.0,,1909.963,0.883,0.883,0.768,0.768,-452794.283
3,Lasso Linear Regression,1.0,Iterations: 100000 and Alpha: 3.685019951033...,1488.173,0.859,0.859,0.859,0.859,0.859
4,Lasso Polynomial Regression,2.0,Iterations: 100000 and Alpha: 352.612582868472,1537.234,0.849,0.849,0.85,0.85,-4.154
5,Lasso Polynomial Regression,3.0,Iterations: 1000000 and Alpha: 1653.54684242...,2582.831,0.571,0.57,0.575,0.575,-416.423


In [12]:
# Ridge regression on the diamonds features. Candidate alphas are typed at the
# interactive prompt as a space-separated list; values around 92 worked best.
regression(
    diamonds,
    ['carat', 'x', 'y', 'z', 'depth', 'table'],
    'price',
    diamond_eval,
    regtype='Ridge',
)

Enter alpha values seperated by spaces 90 91 92 93 94 95


Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,1486.771,0.859,0.859,0.859,0.859,0.854
1,Multivariate Polynomial Regression,2.0,,1886.163,0.876,0.876,0.774,0.773,-42.203
2,Multivariate Polynomial Regression,3.0,,1909.963,0.883,0.883,0.768,0.768,-452794.283
3,Lasso Linear Regression,1.0,Iterations: 100000 and Alpha: 3.685019951033...,1488.173,0.859,0.859,0.859,0.859,0.859
4,Lasso Polynomial Regression,2.0,Iterations: 100000 and Alpha: 352.612582868472,1537.234,0.849,0.849,0.85,0.85,-4.154
5,Lasso Polynomial Regression,3.0,Iterations: 1000000 and Alpha: 1653.54684242...,2582.831,0.571,0.57,0.575,0.575,-416.423
6,Ridge Linear Regression,1.0,Alpha: 92.0,1489.417,0.859,0.859,0.859,0.859,0.858


In [16]:
# Ridge with degree-2 polynomial features; high alpha values work much better.
# Candidate alphas are typed at the interactive prompt.
# NOTE(review): the Ridge Polynomial rows in the recorded table list alphas
# that are not among the values entered at this cell's prompt, and the
# execution count jumps before this cell -- those rows may come from earlier
# runs. Re-run from a fresh kernel to confirm.
regression(
    diamonds,
    ['carat', 'x', 'y', 'z', 'depth', 'table'],
    'price',
    diamond_eval,
    regtype='Ridge',
    poly_deg=2,
)

Enter alpha values seperated by spaces 300 3000 8464 10000


Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,1486.771,0.859,0.859,0.859,0.859,0.854
1,Multivariate Polynomial Regression,2.0,,1886.163,0.876,0.876,0.774,0.773,-42.203
2,Multivariate Polynomial Regression,3.0,,1909.963,0.883,0.883,0.768,0.768,-452794.283
3,Lasso Linear Regression,1.0,Iterations: 100000 and Alpha: 3.685019951033...,1488.173,0.859,0.859,0.859,0.859,0.859
4,Lasso Polynomial Regression,2.0,Iterations: 100000 and Alpha: 352.612582868472,1537.234,0.849,0.849,0.85,0.85,-4.154
5,Lasso Polynomial Regression,3.0,Iterations: 1000000 and Alpha: 1653.54684242...,2582.831,0.571,0.57,0.575,0.575,-416.423
6,Ridge Linear Regression,1.0,Alpha: 92.0,1489.417,0.859,0.859,0.859,0.859,0.858
7,Ridge Polynomial Regression,2.0,Alpha: 95.0,1520.13,0.875,0.875,0.853,0.853,-11.428
8,Ridge Polynomial Regression,2.0,Alpha: 160.0,1482.44,0.874,0.874,0.86,0.86,-7.425
9,Ridge Polynomial Regression,2.0,Alpha: 8462.0,1446.352,0.865,0.865,0.867,0.867,0.321


Now let's look at models on the life expectancy dataset.

In [17]:
# Display the life expectancy frame to inspect its columns before modelling
# (the notebook renders a truncated view of the first and last rows).
life_exp

Unnamed: 0,country,life_expectancy,alcohol,hepatitisB,measles,bmi,polio,diphtheria,hiv,total_expenditure,gdp,thinness_till19,inf_death,school,population,status,pop_size,death_ratio
0,Afghanistan,65.0,0.01,65.0,1154,19.1,6.0,65.0,0.1,8.16,584.259210,17.2,62,10.1,33736494.0,Developing,3,4.241935
1,Afghanistan,59.9,0.01,62.0,492,18.6,58.0,62.0,0.1,8.18,612.696514,17.5,64,10.0,327582.0,Developing,1,4.234375
2,Afghanistan,59.9,0.01,64.0,430,18.1,62.0,64.0,0.1,8.13,631.744976,17.7,66,9.9,31731688.0,Developing,3,4.060606
3,Afghanistan,59.5,0.01,67.0,2787,17.6,67.0,67.0,0.1,8.52,669.959000,17.9,69,9.8,3696958.0,Developing,2,3.942029
4,Afghanistan,59.2,0.01,68.0,3013,17.2,68.0,68.0,0.1,7.87,63.537231,18.2,71,9.5,2978599.0,Developing,2,3.873239
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2933,Zimbabwe,44.3,4.36,68.0,31,27.1,67.0,65.0,33.6,7.13,454.366654,9.4,27,9.2,12777511.0,Developing,3,26.777778
2934,Zimbabwe,44.5,4.06,7.0,998,26.7,7.0,68.0,36.7,6.52,453.351155,9.8,26,9.5,12633897.0,Developing,3,27.500000
2935,Zimbabwe,44.8,4.43,73.0,304,26.3,73.0,71.0,39.8,6.53,57.348340,1.2,25,10.0,125525.0,Developing,1,2.920000
2936,Zimbabwe,45.3,1.72,76.0,529,25.9,76.0,75.0,42.1,6.16,548.587312,1.6,25,9.8,12366165.0,Developing,3,27.440000


In [18]:
# Baseline: multivariate linear regression of life_expectancy on five
# predictors. The resulting metrics row is recorded in life_exp_eval.
regression(
    life_exp,
    ['alcohol', 'hiv', 'gdp', 'school', 'death_ratio'],
    'life_expectancy',
    life_exp_eval,
    regtype='Multivariate',
)

Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,4.646,0.751,0.75,0.711,0.708,0.746


In [19]:
# Same predictors and target as the baseline, with degree-2 polynomial terms.
regression(
    life_exp,
    ['alcohol', 'hiv', 'gdp', 'school', 'death_ratio'],
    'life_expectancy',
    life_exp_eval,
    regtype='Multivariate',
    poly_deg=2,
)

Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,4.646,0.751,0.75,0.711,0.708,0.746
1,Multivariate Polynomial Regression,2.0,,3.996,0.831,0.83,0.787,0.784,0.823


In [20]:
# Degree-3 polynomial variant of the multivariate life expectancy model.
regression(
    life_exp,
    ['alcohol', 'hiv', 'gdp', 'school', 'death_ratio'],
    'life_expectancy',
    life_exp_eval,
    regtype='Multivariate',
    poly_deg=3,
)

Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,4.646,0.751,0.75,0.711,0.708,0.746
1,Multivariate Polynomial Regression,2.0,,3.996,0.831,0.83,0.787,0.784,0.823
2,Multivariate Polynomial Regression,3.0,,3.734,0.854,0.853,0.814,0.811,0.819


In [21]:
# Degree-4 polynomial variant of the multivariate life expectancy model.
# In the recorded output the 5-fold CV score drops below zero at this degree.
regression(
    life_exp,
    ['alcohol', 'hiv', 'gdp', 'school', 'death_ratio'],
    'life_expectancy',
    life_exp_eval,
    regtype='Multivariate',
    poly_deg=4,
)

Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,4.646,0.751,0.75,0.711,0.708,0.746
1,Multivariate Polynomial Regression,2.0,,3.996,0.831,0.83,0.787,0.784,0.823
2,Multivariate Polynomial Regression,3.0,,3.734,0.854,0.853,0.814,0.811,0.819
3,Multivariate Polynomial Regression,4.0,,3.54,0.877,0.877,0.832,0.83,-0.074


In [22]:
# Degree-5 polynomial variant of the multivariate life expectancy model.
# In the recorded output training R-squared keeps rising while test R-squared
# and the CV score go negative, which points to overfitting at this degree.
regression(
    life_exp,
    ['alcohol', 'hiv', 'gdp', 'school', 'death_ratio'],
    'life_expectancy',
    life_exp_eval,
    regtype='Multivariate',
    poly_deg=5,
)

Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,4.646,0.751,0.75,0.711,0.708,0.746
1,Multivariate Polynomial Regression,2.0,,3.996,0.831,0.83,0.787,0.784,0.823
2,Multivariate Polynomial Regression,3.0,,3.734,0.854,0.853,0.814,0.811,0.819
3,Multivariate Polynomial Regression,4.0,,3.54,0.877,0.877,0.832,0.83,-0.074
4,Multivariate Polynomial Regression,5.0,,23.292,0.902,0.902,-6.252,-6.341,-75.038


In [24]:
# Lasso regression on the life expectancy predictors. regression() asks for
# the iteration count at run time (interactive prompt); the alpha shown in the
# results table is not supplied here.
regression(
    life_exp,
    ['alcohol', 'hiv', 'gdp', 'school', 'death_ratio'],
    'life_expectancy',
    life_exp_eval,
    regtype='Lasso',
)

How many interations? 100000


Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,4.646,0.751,0.75,0.711,0.708,0.746
1,Multivariate Polynomial Regression,2.0,,3.996,0.831,0.83,0.787,0.784,0.823
2,Multivariate Polynomial Regression,3.0,,3.734,0.854,0.853,0.814,0.811,0.819
3,Multivariate Polynomial Regression,4.0,,3.54,0.877,0.877,0.832,0.83,-0.074
4,Multivariate Polynomial Regression,5.0,,23.292,0.902,0.902,-6.252,-6.341,-75.038
5,Lasso Linear Regression,1.0,Iterations: 100000 and Alpha: 0.017256881441...,4.644,0.751,0.75,0.712,0.708,0.746


In [25]:
# Lasso with degree-2 polynomial features on the life expectancy data.
# The iteration count is entered at the interactive prompt.
regression(
    life_exp,
    ['alcohol', 'hiv', 'gdp', 'school', 'death_ratio'],
    'life_expectancy',
    life_exp_eval,
    regtype='Lasso',
    poly_deg=2,
)

How many interations? 100000


Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,4.646,0.751,0.75,0.711,0.708,0.746
1,Multivariate Polynomial Regression,2.0,,3.996,0.831,0.83,0.787,0.784,0.823
2,Multivariate Polynomial Regression,3.0,,3.734,0.854,0.853,0.814,0.811,0.819
3,Multivariate Polynomial Regression,4.0,,3.54,0.877,0.877,0.832,0.83,-0.074
4,Multivariate Polynomial Regression,5.0,,23.292,0.902,0.902,-6.252,-6.341,-75.038
5,Lasso Linear Regression,1.0,Iterations: 100000 and Alpha: 0.017256881441...,4.644,0.751,0.75,0.712,0.708,0.746
6,Lasso Polynomial Regression,2.0,Iterations: 100000 and Alpha: 0.019167177496...,3.986,0.83,0.829,0.788,0.785,0.823


In [26]:
# Lasso with degree-3 polynomial features on the life expectancy data.
# The iteration count is entered at the interactive prompt.
regression(
    life_exp,
    ['alcohol', 'hiv', 'gdp', 'school', 'death_ratio'],
    'life_expectancy',
    life_exp_eval,
    regtype='Lasso',
    poly_deg=3,
)

How many interations? 100000


Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,4.646,0.751,0.75,0.711,0.708,0.746
1,Multivariate Polynomial Regression,2.0,,3.996,0.831,0.83,0.787,0.784,0.823
2,Multivariate Polynomial Regression,3.0,,3.734,0.854,0.853,0.814,0.811,0.819
3,Multivariate Polynomial Regression,4.0,,3.54,0.877,0.877,0.832,0.83,-0.074
4,Multivariate Polynomial Regression,5.0,,23.292,0.902,0.902,-6.252,-6.341,-75.038
5,Lasso Linear Regression,1.0,Iterations: 100000 and Alpha: 0.017256881441...,4.644,0.751,0.75,0.712,0.708,0.746
6,Lasso Polynomial Regression,2.0,Iterations: 100000 and Alpha: 0.019167177496...,3.986,0.83,0.829,0.788,0.785,0.823
7,Lasso Polynomial Regression,3.0,Iterations: 100000 and Alpha: 0.108389123248...,3.934,0.835,0.834,0.793,0.791,0.826


In [27]:
# Lasso with degree-4 polynomial features on the life expectancy data.
# The iteration count is entered at the interactive prompt.
regression(
    life_exp,
    ['alcohol', 'hiv', 'gdp', 'school', 'death_ratio'],
    'life_expectancy',
    life_exp_eval,
    regtype='Lasso',
    poly_deg=4,
)

How many interations? 100000


Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,4.646,0.751,0.75,0.711,0.708,0.746
1,Multivariate Polynomial Regression,2.0,,3.996,0.831,0.83,0.787,0.784,0.823
2,Multivariate Polynomial Regression,3.0,,3.734,0.854,0.853,0.814,0.811,0.819
3,Multivariate Polynomial Regression,4.0,,3.54,0.877,0.877,0.832,0.83,-0.074
4,Multivariate Polynomial Regression,5.0,,23.292,0.902,0.902,-6.252,-6.341,-75.038
5,Lasso Linear Regression,1.0,Iterations: 100000 and Alpha: 0.017256881441...,4.644,0.751,0.75,0.712,0.708,0.746
6,Lasso Polynomial Regression,2.0,Iterations: 100000 and Alpha: 0.019167177496...,3.986,0.83,0.829,0.788,0.785,0.823
7,Lasso Polynomial Regression,3.0,Iterations: 100000 and Alpha: 0.108389123248...,3.934,0.835,0.834,0.793,0.791,0.826
8,Lasso Polynomial Regression,4.0,Iterations: 100000 and Alpha: 0.667883866400...,4.477,0.773,0.772,0.732,0.729,0.755


In [29]:
# Ridge regression on the life expectancy predictors. Candidate alphas are
# typed at the interactive prompt as a space-separated list; the alpha reported
# in the results table is one of them.
regression(
    life_exp,
    ['alcohol', 'hiv', 'gdp', 'school', 'death_ratio'],
    'life_expectancy',
    life_exp_eval,
    regtype='Ridge',
)

Enter alpha values seperated by spaces 0.1 0.2 0.3 0.4 0.5 0.6 0.7 0.8 0.9 1


Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,4.646,0.751,0.75,0.711,0.708,0.746
1,Multivariate Polynomial Regression,2.0,,3.996,0.831,0.83,0.787,0.784,0.823
2,Multivariate Polynomial Regression,3.0,,3.734,0.854,0.853,0.814,0.811,0.819
3,Multivariate Polynomial Regression,4.0,,3.54,0.877,0.877,0.832,0.83,-0.074
4,Multivariate Polynomial Regression,5.0,,23.292,0.902,0.902,-6.252,-6.341,-75.038
5,Lasso Linear Regression,1.0,Iterations: 100000 and Alpha: 0.017256881441...,4.644,0.751,0.75,0.712,0.708,0.746
6,Lasso Polynomial Regression,2.0,Iterations: 100000 and Alpha: 0.019167177496...,3.986,0.83,0.829,0.788,0.785,0.823
7,Lasso Polynomial Regression,3.0,Iterations: 100000 and Alpha: 0.108389123248...,3.934,0.835,0.834,0.793,0.791,0.826
8,Lasso Polynomial Regression,4.0,Iterations: 100000 and Alpha: 0.667883866400...,4.477,0.773,0.772,0.732,0.729,0.755
9,Ridge Linear Regression,1.0,Alpha: 1.0,4.646,0.751,0.75,0.712,0.708,0.746


In [30]:
# Ridge again on the same predictors, trying a wider range of alphas at the
# interactive prompt.
# NOTE(review): the output saved with this cell shows life_exp_eval unchanged
# (no additional Ridge row) -- confirm whether regression() recorded this run.
regression(
    life_exp,
    ['alcohol', 'hiv', 'gdp', 'school', 'death_ratio'],
    'life_expectancy',
    life_exp_eval,
    regtype='Ridge',
)

Enter alpha values seperated by spaces 1 5 10 15 20 25 40 80


Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,4.646,0.751,0.75,0.711,0.708,0.746
1,Multivariate Polynomial Regression,2.0,,3.996,0.831,0.83,0.787,0.784,0.823
2,Multivariate Polynomial Regression,3.0,,3.734,0.854,0.853,0.814,0.811,0.819
3,Multivariate Polynomial Regression,4.0,,3.54,0.877,0.877,0.832,0.83,-0.074
4,Multivariate Polynomial Regression,5.0,,23.292,0.902,0.902,-6.252,-6.341,-75.038
5,Lasso Linear Regression,1.0,Iterations: 100000 and Alpha: 0.017256881441...,4.644,0.751,0.75,0.712,0.708,0.746
6,Lasso Polynomial Regression,2.0,Iterations: 100000 and Alpha: 0.019167177496...,3.986,0.83,0.829,0.788,0.785,0.823
7,Lasso Polynomial Regression,3.0,Iterations: 100000 and Alpha: 0.108389123248...,3.934,0.835,0.834,0.793,0.791,0.826
8,Lasso Polynomial Regression,4.0,Iterations: 100000 and Alpha: 0.667883866400...,4.477,0.773,0.772,0.732,0.729,0.755
9,Ridge Linear Regression,1.0,Alpha: 1.0,4.646,0.751,0.75,0.712,0.708,0.746


In [31]:
# Ridge once more on the same predictors, with a narrower set of alphas typed
# at the interactive prompt.
# NOTE(review): the output saved with this cell shows life_exp_eval unchanged
# (no additional Ridge row) -- confirm whether regression() recorded this run.
regression(
    life_exp,
    ['alcohol', 'hiv', 'gdp', 'school', 'death_ratio'],
    'life_expectancy',
    life_exp_eval,
    regtype='Ridge',
)

Enter alpha values seperated by spaces 2 3 4 5 6 7 8


Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,4.646,0.751,0.75,0.711,0.708,0.746
1,Multivariate Polynomial Regression,2.0,,3.996,0.831,0.83,0.787,0.784,0.823
2,Multivariate Polynomial Regression,3.0,,3.734,0.854,0.853,0.814,0.811,0.819
3,Multivariate Polynomial Regression,4.0,,3.54,0.877,0.877,0.832,0.83,-0.074
4,Multivariate Polynomial Regression,5.0,,23.292,0.902,0.902,-6.252,-6.341,-75.038
5,Lasso Linear Regression,1.0,Iterations: 100000 and Alpha: 0.017256881441...,4.644,0.751,0.75,0.712,0.708,0.746
6,Lasso Polynomial Regression,2.0,Iterations: 100000 and Alpha: 0.019167177496...,3.986,0.83,0.829,0.788,0.785,0.823
7,Lasso Polynomial Regression,3.0,Iterations: 100000 and Alpha: 0.108389123248...,3.934,0.835,0.834,0.793,0.791,0.826
8,Lasso Polynomial Regression,4.0,Iterations: 100000 and Alpha: 0.667883866400...,4.477,0.773,0.772,0.732,0.729,0.755
9,Ridge Linear Regression,1.0,Alpha: 1.0,4.646,0.751,0.75,0.712,0.708,0.746


In [32]:
# Ridge with degree-2 polynomial features on the life expectancy data.
# Candidate alphas are typed at the interactive prompt.
# NOTE(review): the output saved with this cell contains no Ridge Polynomial
# row -- confirm whether regression() recorded this run.
regression(
    life_exp,
    ['alcohol', 'hiv', 'gdp', 'school', 'death_ratio'],
    'life_expectancy',
    life_exp_eval,
    regtype='Ridge',
    poly_deg=2,
)

Enter alpha values seperated by spaces 6 7 8 9 10 40


Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,4.646,0.751,0.75,0.711,0.708,0.746
1,Multivariate Polynomial Regression,2.0,,3.996,0.831,0.83,0.787,0.784,0.823
2,Multivariate Polynomial Regression,3.0,,3.734,0.854,0.853,0.814,0.811,0.819
3,Multivariate Polynomial Regression,4.0,,3.54,0.877,0.877,0.832,0.83,-0.074
4,Multivariate Polynomial Regression,5.0,,23.292,0.902,0.902,-6.252,-6.341,-75.038
5,Lasso Linear Regression,1.0,Iterations: 100000 and Alpha: 0.017256881441...,4.644,0.751,0.75,0.712,0.708,0.746
6,Lasso Polynomial Regression,2.0,Iterations: 100000 and Alpha: 0.019167177496...,3.986,0.83,0.829,0.788,0.785,0.823
7,Lasso Polynomial Regression,3.0,Iterations: 100000 and Alpha: 0.108389123248...,3.934,0.835,0.834,0.793,0.791,0.826
8,Lasso Polynomial Regression,4.0,Iterations: 100000 and Alpha: 0.667883866400...,4.477,0.773,0.772,0.732,0.729,0.755
9,Ridge Linear Regression,1.0,Alpha: 1.0,4.646,0.751,0.75,0.712,0.708,0.746


In [33]:
# Degree-2 Ridge again, with a different set of alphas typed at the
# interactive prompt.
# NOTE(review): the output saved with this cell contains no Ridge Polynomial
# row -- confirm whether regression() recorded this run.
regression(
    life_exp,
    ['alcohol', 'hiv', 'gdp', 'school', 'death_ratio'],
    'life_expectancy',
    life_exp_eval,
    regtype='Ridge',
    poly_deg=2,
)

Enter alpha values seperated by spaces 1 2 3 4 5 6


Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,4.646,0.751,0.75,0.711,0.708,0.746
1,Multivariate Polynomial Regression,2.0,,3.996,0.831,0.83,0.787,0.784,0.823
2,Multivariate Polynomial Regression,3.0,,3.734,0.854,0.853,0.814,0.811,0.819
3,Multivariate Polynomial Regression,4.0,,3.54,0.877,0.877,0.832,0.83,-0.074
4,Multivariate Polynomial Regression,5.0,,23.292,0.902,0.902,-6.252,-6.341,-75.038
5,Lasso Linear Regression,1.0,Iterations: 100000 and Alpha: 0.017256881441...,4.644,0.751,0.75,0.712,0.708,0.746
6,Lasso Polynomial Regression,2.0,Iterations: 100000 and Alpha: 0.019167177496...,3.986,0.83,0.829,0.788,0.785,0.823
7,Lasso Polynomial Regression,3.0,Iterations: 100000 and Alpha: 0.108389123248...,3.934,0.835,0.834,0.793,0.791,0.826
8,Lasso Polynomial Regression,4.0,Iterations: 100000 and Alpha: 0.667883866400...,4.477,0.773,0.772,0.732,0.729,0.755
9,Ridge Linear Regression,1.0,Alpha: 1.0,4.646,0.751,0.75,0.712,0.708,0.746


In [34]:
# Ridge with degree-3 polynomial features on the life expectancy data.
# Candidate alphas are typed at the interactive prompt.
# NOTE(review): the output saved with this cell contains no Ridge Polynomial
# row -- confirm whether regression() recorded this run.
regression(
    life_exp,
    ['alcohol', 'hiv', 'gdp', 'school', 'death_ratio'],
    'life_expectancy',
    life_exp_eval,
    regtype='Ridge',
    poly_deg=3,
)

Enter alpha values seperated by spaces 2 3 4 5 6 




Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,4.646,0.751,0.75,0.711,0.708,0.746
1,Multivariate Polynomial Regression,2.0,,3.996,0.831,0.83,0.787,0.784,0.823
2,Multivariate Polynomial Regression,3.0,,3.734,0.854,0.853,0.814,0.811,0.819
3,Multivariate Polynomial Regression,4.0,,3.54,0.877,0.877,0.832,0.83,-0.074
4,Multivariate Polynomial Regression,5.0,,23.292,0.902,0.902,-6.252,-6.341,-75.038
5,Lasso Linear Regression,1.0,Iterations: 100000 and Alpha: 0.017256881441...,4.644,0.751,0.75,0.712,0.708,0.746
6,Lasso Polynomial Regression,2.0,Iterations: 100000 and Alpha: 0.019167177496...,3.986,0.83,0.829,0.788,0.785,0.823
7,Lasso Polynomial Regression,3.0,Iterations: 100000 and Alpha: 0.108389123248...,3.934,0.835,0.834,0.793,0.791,0.826
8,Lasso Polynomial Regression,4.0,Iterations: 100000 and Alpha: 0.667883866400...,4.477,0.773,0.772,0.732,0.729,0.755
9,Ridge Linear Regression,1.0,Alpha: 1.0,4.646,0.751,0.75,0.712,0.708,0.746


In [35]:
# Ridge with degree-4 polynomial features on the life expectancy data.
# Candidate alphas are typed at the interactive prompt.
# NOTE(review): the output saved with this cell contains no Ridge Polynomial
# row -- confirm whether regression() recorded this run.
regression(
    life_exp,
    ['alcohol', 'hiv', 'gdp', 'school', 'death_ratio'],
    'life_expectancy',
    life_exp_eval,
    regtype='Ridge',
    poly_deg=4,
)

Enter alpha values seperated by spaces 5 6 7 8 9




Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,4.646,0.751,0.75,0.711,0.708,0.746
1,Multivariate Polynomial Regression,2.0,,3.996,0.831,0.83,0.787,0.784,0.823
2,Multivariate Polynomial Regression,3.0,,3.734,0.854,0.853,0.814,0.811,0.819
3,Multivariate Polynomial Regression,4.0,,3.54,0.877,0.877,0.832,0.83,-0.074
4,Multivariate Polynomial Regression,5.0,,23.292,0.902,0.902,-6.252,-6.341,-75.038
5,Lasso Linear Regression,1.0,Iterations: 100000 and Alpha: 0.017256881441...,4.644,0.751,0.75,0.712,0.708,0.746
6,Lasso Polynomial Regression,2.0,Iterations: 100000 and Alpha: 0.019167177496...,3.986,0.83,0.829,0.788,0.785,0.823
7,Lasso Polynomial Regression,3.0,Iterations: 100000 and Alpha: 0.108389123248...,3.934,0.835,0.834,0.793,0.791,0.826
8,Lasso Polynomial Regression,4.0,Iterations: 100000 and Alpha: 0.667883866400...,4.477,0.773,0.772,0.732,0.729,0.755
9,Ridge Linear Regression,1.0,Alpha: 1.0,4.646,0.751,0.75,0.712,0.708,0.746


In [36]:
# Final comparison table of every diamond model recorded above.
diamond_eval

Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,1486.771,0.859,0.859,0.859,0.859,0.854
1,Multivariate Polynomial Regression,2.0,,1886.163,0.876,0.876,0.774,0.773,-42.203
2,Multivariate Polynomial Regression,3.0,,1909.963,0.883,0.883,0.768,0.768,-452794.283
3,Lasso Linear Regression,1.0,Iterations: 100000 and Alpha: 3.685019951033...,1488.173,0.859,0.859,0.859,0.859,0.859
4,Lasso Polynomial Regression,2.0,Iterations: 100000 and Alpha: 352.612582868472,1537.234,0.849,0.849,0.85,0.85,-4.154
5,Lasso Polynomial Regression,3.0,Iterations: 1000000 and Alpha: 1653.54684242...,2582.831,0.571,0.57,0.575,0.575,-416.423
6,Ridge Linear Regression,1.0,Alpha: 92.0,1489.417,0.859,0.859,0.859,0.859,0.858
7,Ridge Polynomial Regression,2.0,Alpha: 95.0,1520.13,0.875,0.875,0.853,0.853,-11.428
8,Ridge Polynomial Regression,2.0,Alpha: 160.0,1482.44,0.874,0.874,0.86,0.86,-7.425
9,Ridge Polynomial Regression,2.0,Alpha: 8462.0,1446.352,0.865,0.865,0.867,0.867,0.321


In [37]:
# Final comparison table of every life expectancy model recorded above.
# NOTE(review): no Ridge Polynomial rows appear here even though several such
# cells were run -- confirm those runs were recorded.
life_exp_eval

Unnamed: 0,Model,Power,Hyper Parameters,Root Mean Squared Error (RMSE),R-squared (training),Adjusted R-squared (training),R-squared (test),Adjusted R-squared (test),5-Fold Cross Validation
0,Multivariate Linear Regression,1.0,,4.646,0.751,0.75,0.711,0.708,0.746
1,Multivariate Polynomial Regression,2.0,,3.996,0.831,0.83,0.787,0.784,0.823
2,Multivariate Polynomial Regression,3.0,,3.734,0.854,0.853,0.814,0.811,0.819
3,Multivariate Polynomial Regression,4.0,,3.54,0.877,0.877,0.832,0.83,-0.074
4,Multivariate Polynomial Regression,5.0,,23.292,0.902,0.902,-6.252,-6.341,-75.038
5,Lasso Linear Regression,1.0,Iterations: 100000 and Alpha: 0.017256881441...,4.644,0.751,0.75,0.712,0.708,0.746
6,Lasso Polynomial Regression,2.0,Iterations: 100000 and Alpha: 0.019167177496...,3.986,0.83,0.829,0.788,0.785,0.823
7,Lasso Polynomial Regression,3.0,Iterations: 100000 and Alpha: 0.108389123248...,3.934,0.835,0.834,0.793,0.791,0.826
8,Lasso Polynomial Regression,4.0,Iterations: 100000 and Alpha: 0.667883866400...,4.477,0.773,0.772,0.732,0.729,0.755
9,Ridge Linear Regression,1.0,Alpha: 1.0,4.646,0.751,0.75,0.712,0.708,0.746
