## **Non-Negative Least Squares**

In [None]:
import numpy as np
import matplotlib.pyplot as plt
from sklearn.metrics import r2_score

In [None]:
# Build a reproducible synthetic regression problem.

# Seed the global NumPy RNG so every draw below is repeatable on a fresh run.
np.random.seed(42)

n_samples, n_features = 200, 50

# Design matrix: one row per sample, standard-normal entries.
X = np.random.standard_normal(size=(n_samples, n_features))

# Ground-truth weights: standard-normal draws scaled by 3 (signs are still mixed).
true_coef = np.random.standard_normal(size=n_features) * 3

In [None]:
# Clamp the negative ground-truth weights to zero (in place), then compute
# the noiseless targets from the now non-negative weights.

true_coef[...] = np.where(true_coef < 0, 0, true_coef)
y = X.dot(true_coef)

In [None]:
# Perturb the targets with zero-mean Gaussian noise scaled by 5.
# NOTE: `y` is updated in place, so re-running this cell on its own adds a
# second layer of noise; re-run from the data-generation cell instead.

y += np.random.normal(size=n_samples) * 5

In [None]:
# Hold out half of the samples as a test set.

from sklearn.model_selection import train_test_split

# Pin `random_state` so the partition does not depend on how many draws have
# already been taken from the global NumPy RNG: re-running this cell alone
# (or after re-running the noise cell) reproduces the same split.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.5, random_state=42
)

In [None]:
# Fit the non-negative least squares (NNLS) model and score it on the test set.

from types import SimpleNamespace

from scipy.optimize import nnls
from sklearn.linear_model import LinearRegression

try:
    # The `positive` option only exists in scikit-learn >= 0.24; older
    # releases reject the keyword with a TypeError at construction time.
    reg_nnls = LinearRegression(positive=True)
except TypeError:
    reg_nnls = None

if reg_nnls is not None:
    y_pred_nnls = reg_nnls.fit(X_train, y_train).predict(X_test)
else:
    # Fallback for older scikit-learn: solve the same problem directly.
    # Centre the data so an unconstrained intercept is fitted, run NNLS on
    # the centred problem, then recover the intercept from the offsets.
    X_offset = X_train.mean(axis=0)
    y_offset = y_train.mean()
    nnls_coef, _ = nnls(X_train - X_offset, y_train - y_offset)
    # Expose the same `coef_` / `intercept_` attributes that later cells read.
    reg_nnls = SimpleNamespace(
        coef_=nnls_coef,
        intercept_=y_offset - np.dot(X_offset, nnls_coef),
    )
    y_pred_nnls = np.dot(X_test, reg_nnls.coef_) + reg_nnls.intercept_

r2_score_nnls = r2_score(y_test, y_pred_nnls)
print("NNLS R2 Score : {0}".format(r2_score_nnls))

TypeError: ignored

In [None]:
# Ordinary least squares baseline: same data, no sign constraint on the
# coefficients.

from sklearn.linear_model import LinearRegression

reg_ols = LinearRegression()
reg_ols.fit(X_train, y_train)
y_pred_ols = reg_ols.predict(X_test)

r2_score_ols = r2_score(y_true=y_test, y_pred=y_pred_ols)
print("OLS R2 Score : {0}".format(r2_score_ols))

In [None]:
# Scatter the NNLS coefficients against the OLS coefficients and overlay the
# identity line as a visual reference.

fig, ax = plt.subplots()
ax.plot(reg_ols.coef_, reg_nnls.coef_, marker='.', linewidth=0)

# Read the auto-scaled limits before the diagonal is drawn.
(low_x, high_x), (low_y, high_y) = ax.get_xlim(), ax.get_ylim()

# Restrict the diagonal to the interval covered by both axes.
low = max(low_x, low_y)
high = min(high_x, high_y)

ax.plot([low, high], [low, high], linestyle='--', color='.3', alpha=0.5)
ax.set_xlabel("OLS regression coefficients", fontweight="bold")
ax.set_ylabel("NNLS regression coefficients", fontweight="bold")