In [3]:
import numpy as np
from sklearn import linear_model
import sklearn.metrics as sm
from sklearn.preprocessing import PolynomialFeatures

# Location of the comma-separated dataset
input_file = 'data_multivar_regr.txt'

# Read every row; all columns except the last become the features (X)
# and the last column becomes the target (y)
data = np.loadtxt(input_file, delimiter=',')
X = data[:, :-1]
y = data[:, -1]

# Reserve the first 80% of the rows for training and the rest for testing
num_training = int(0.8 * len(X))
num_test = len(X) - num_training

# Slice features and targets at the same boundary so rows stay aligned
X_train, X_test = X[:num_training], X[num_training:]
y_train, y_test = y[:num_training], y[num_training:]

# Build a linear regression model and fit it on the training split
# (fit() returns the estimator itself, so construction and training chain)
linear_regressor = linear_model.LinearRegression().fit(X_train, y_train)

# Run the fitted model over the held-out rows
y_test_pred = linear_regressor.predict(X_test)

# Compute performance metrics on the test split.
# Every metric goes through the same round(..., 2) call so that all scores are
# reported with two decimals; passing the precision to str.format() instead of
# round() would silently leave a value unrounded.
print('Linear regressor performance')
metrics = (
    ('Mean absolute error', sm.mean_absolute_error),
    ('Mean squared error', sm.mean_squared_error),
    ('Median absolute error', sm.median_absolute_error),
    ('Explain variance score', sm.explained_variance_score),
    ('R2 score', sm.r2_score),
)
for label, metric in metrics:
    print('{} = {}'.format(label, round(metric(y_test, y_test_pred), 2)))

# Polynomial Regression
# Expand the training features into polynomial terms up to degree 10;
# the transformer is fitted on the training data here.
polynomial = PolynomialFeatures(degree=10)
X_train_transformed = polynomial.fit_transform(X_train)

# Single sample used to compare the two models
datapoint = [[7.75, 6.35, 5.56]]
# Only transform the sample: it must go through the transformer that was
# already fitted on the training data, not re-fit it on inference input.
poly_datapoint = polynomial.transform(datapoint)

# Create linear model on the expanded features to compare the difference
poly_linear_model = linear_model.LinearRegression()
poly_linear_model.fit(X_train_transformed, y_train)

print('\nLinear regression:', linear_regressor.predict(datapoint))
print('\nPolynomial regression:', poly_linear_model.predict(poly_datapoint))

Linear regressor performance
Mean absolute error = 3.58
Mean squared error = 20.31
Median absolute error = 2.99
Explain variance score = 0.86
R2 score = 0.8648119185190575

Linear regression: [ 36.05286276]

Polynomial regression: [ 41.47360915]
