
<br>
========================================<br>
Lasso and Elastic Net for Sparse Signals<br>
========================================<br>
Estimates Lasso and Elastic-Net regression models on a manually generated<br>
sparse signal corrupted with additive noise. The estimated coefficients are<br>
compared with the ground truth.<br>


In [None]:
# Echo the module-level docstring (``__doc__``) to the output.
# NOTE(review): in this cell-based layout the description above is plain
# prose rather than a docstring, so this may not print that text -- confirm.
print(__doc__)

In [None]:
import numpy as np
import matplotlib.pyplot as plt

In [None]:
from sklearn.metrics import r2_score

#############################################################################<br>
Generate some sparse data to play with

In [None]:
# Seed NumPy's global random generator so that the random draws made
# further down (design matrix and noise) are reproducible between runs.
np.random.seed(42)

In [None]:
# Problem size: fewer samples than features.
n_samples = 50
n_features = 100

# Design matrix filled with draws from the standard normal distribution,
# one row per sample and one column per feature.
X = np.random.standard_normal(size=(n_samples, n_features))

Decreasing coefficients with alternating signs, for visualization

In [None]:
# One index per feature: 0, 1, ..., n_features - 1.
idx = np.arange(n_features)

# Exponentially decaying magnitude exp(-i / 10) with sign (-1)**i, so the
# coefficients alternate between positive and negative.
coef = np.exp(-idx / 10) * (-1) ** idx

# Keep only the first ten coefficients; all the others are set to zero,
# which makes the true signal sparse.
coef[10:] = 0

# Noise-free targets: linear combination of the columns of X.
y = X.dot(coef)

Add noise

In [None]:
# Perturb the targets in place: one draw per sample from np.random.normal
# (default mean 0, standard deviation 1), scaled by 0.01.
y += 0.01 * np.random.normal(size=n_samples)

Split the data into a training set and a test set

In [None]:
# Number of rows in the design matrix.
n_samples = len(X)

# First half of the rows is used for training, the remaining rows for
# testing; features and targets are cut at the same position.
X_train, X_test = X[:n_samples // 2], X[n_samples // 2:]
y_train, y_test = y[:n_samples // 2], y[n_samples // 2:]

#############################################################################<br>
Lasso

In [None]:
from sklearn.linear_model import Lasso

In [None]:
# Regularization strength; the same value is passed to the ElasticNet
# model created further down in this file.
alpha = 0.1
# Lasso estimator configured with that strength (not fitted yet).
lasso = Lasso(alpha=alpha)

In [None]:
# Fit the Lasso model on the training half, then predict the held-out half.
lasso.fit(X_train, y_train)
y_pred_lasso = lasso.predict(X_test)

# Coefficient of determination of the predictions on the test targets.
r2_score_lasso = r2_score(y_test, y_pred_lasso)

# Report the estimator (its repr) followed by its test score.
print(lasso)
print("r^2 on test data : %f" % r2_score_lasso)

#############################################################################<br>
ElasticNet

In [None]:
from sklearn.linear_model import ElasticNet

In [None]:
# Elastic-Net estimator using the same ``alpha`` as the Lasso model above.
# ``l1_ratio=0.7`` sets the mix between the L1 and L2 penalties (see the
# scikit-learn ElasticNet documentation for the exact objective).
enet = ElasticNet(alpha=alpha, l1_ratio=0.7)

In [None]:
# Fit the Elastic-Net model on the training half, then predict the
# held-out half.
enet.fit(X_train, y_train)
y_pred_enet = enet.predict(X_test)

# Coefficient of determination of the predictions on the test targets.
r2_score_enet = r2_score(y_test, y_pred_enet)

# Report the estimator (its repr) followed by its test score.
print(enet)
print("r^2 on test data : %f" % r2_score_enet)

In [None]:
# Stem plots of the non-zero coefficients of both fitted models, overlaid
# with the non-zero ground-truth coefficients.  For a coefficient vector
# ``c``, ``np.where(c)[0]`` gives the positions of its non-zero entries and
# ``c[c != 0]`` the matching values.
#
# ``use_line_collection`` is deliberately not passed to ``plt.stem``: the
# parameter was deprecated in Matplotlib 3.6 and removed in 3.8, where
# passing it raises a TypeError.  Since Matplotlib 3.3 the stem lines are
# drawn as a single LineCollection by default, so the result is the same.
#
# ``plt.stem`` returns (markerline, stemlines, baseline); ``plt.setp``
# recolours the markers and stems and leaves the baseline untouched.
m, s, _ = plt.stem(np.where(enet.coef_)[0], enet.coef_[enet.coef_ != 0],
                   markerfmt='x', label='Elastic net coefficients')
plt.setp([m, s], color="#2ca02c")
m, s, _ = plt.stem(np.where(lasso.coef_)[0], lasso.coef_[lasso.coef_ != 0],
                   markerfmt='x', label='Lasso coefficients')
plt.setp([m, s], color='#ff7f0e')
# Ground truth is drawn with blue 'x' markers via the format string.
plt.stem(np.where(coef)[0], coef[coef != 0], label='true coefficients',
         markerfmt='bx')

In [None]:
# Title shows both test-set R^2 scores, rounded to three decimals.
plt.title(
    "Lasso $R^2$: %.3f, Elastic Net $R^2$: %.3f"
    % (r2_score_lasso, r2_score_enet)
)
# Let Matplotlib choose the legend position.
plt.legend(loc='best')
# Display the figure.
plt.show()