[MRG] Add jitter to LassoLars #15179

Merged (24 commits, Apr 17, 2020)
Changes from 17 commits

39 changes: 35 additions & 4 deletions sklearn/linear_model/_least_angle.py
@@ -19,7 +19,7 @@

from ._base import LinearModel
from ..base import RegressorMixin, MultiOutputMixin
-from ..utils import arrayfuncs, as_float_array, check_X_y
+from ..utils import arrayfuncs, as_float_array, check_X_y, check_random_state
from ..model_selection import check_cv
from ..exceptions import ConvergenceWarning

@@ -799,6 +799,15 @@ class Lars(MultiOutputMixin, RegressorMixin, LinearModel):
setting ``fit_path`` to ``False`` will lead to a speedup, especially
with a small alpha.

jitter : float, default=None
Upper bound on a uniform noise parameter to be added to the ``y``
values, to satisfy the model's assumption of one-at-a-time computations.

random_state : int, RandomState instance or None (default)
Determines random number generation for jittering. Pass an int
for reproducible output across multiple function calls.
See :term:`Glossary <random_state>`. Ignored if ``jitter`` is None.

Attributes
----------
alphas_ : array-like of shape (n_alphas + 1,) | list of n_targets such \
@@ -845,7 +854,8 @@ class Lars(MultiOutputMixin, RegressorMixin, LinearModel):

def __init__(self, fit_intercept=True, verbose=False, normalize=True,
precompute='auto', n_nonzero_coefs=500,
-eps=np.finfo(np.float).eps, copy_X=True, fit_path=True):
+eps=np.finfo(np.float).eps, copy_X=True, fit_path=True,
+jitter=None, random_state=None):
self.fit_intercept = fit_intercept
self.verbose = verbose
self.normalize = normalize
@@ -854,6 +864,8 @@ def __init__(self, fit_intercept=True, verbose=False, normalize=True,
self.eps = eps
self.copy_X = copy_X
self.fit_path = fit_path
self.jitter = jitter
self.random_state = random_state

@staticmethod
def _get_gram(precompute, X, y):
@@ -953,6 +965,12 @@ def fit(self, X, y, Xy=None):
else:
max_iter = self.max_iter

if self.jitter is not None:
rng = check_random_state(self.random_state)

noise = rng.uniform(high=self.jitter, size=len(y))
y = y + noise

self._fit(X, y, max_iter=max_iter, alpha=alpha, fit_path=self.fit_path,
Xy=Xy)
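For readers skimming the diff, here is a minimal standalone sketch of what the block above does (check_random_state is scikit-learn's existing helper; the y values and parameter settings are illustrative, not taken from this PR):

import numpy as np
from sklearn.utils import check_random_state

y = np.array([-2.5, -2.5])      # illustrative, exactly tied targets
jitter, random_state = 1e-8, 0  # illustrative parameter values

rng = check_random_state(random_state)         # int seed -> RandomState
noise = rng.uniform(high=jitter, size=len(y))  # uniform draws from [0, jitter)
y_jittered = y + noise                         # exact ties are now broken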

@@ -1030,6 +1048,15 @@ class LassoLars(Lars):
algorithm are typically in congruence with the solution of the
coordinate descent Lasso estimator.

jitter : float, default=None
Upper bound on a uniform noise parameter to be added to the ``y``
values, to satisfy the model's assumption of one-at-a-time computations.

random_state : int, RandomState instance or None (default)
Determines random number generation for jittering. Pass an int
for reproducible output across multiple function calls.
See :term:`Glossary <random_state>`. Ignored if ``jitter`` is None.

Attributes
----------
alphas_ : array-like of shape (n_alphas + 1,) | list of n_targets such \
@@ -1082,7 +1109,7 @@ class LassoLars(Lars):
def __init__(self, alpha=1.0, fit_intercept=True, verbose=False,
normalize=True, precompute='auto', max_iter=500,
eps=np.finfo(np.float).eps, copy_X=True, fit_path=True,
-positive=False):
+positive=False, jitter=None, random_state=None):
self.alpha = alpha
self.fit_intercept = fit_intercept
self.max_iter = max_iter
@@ -1093,6 +1120,8 @@ def __init__(self, alpha=1.0, fit_intercept=True, verbose=False,
self.copy_X = copy_X
self.eps = eps
self.fit_path = fit_path
self.jitter = jitter
self.random_state = random_state
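For context, a hypothetical usage sketch of the new constructor parameters (values borrowed from the test further down; assumes an installed build that includes this branch):

from sklearn.linear_model import LassoLars

# jitter bounds the uniform noise added to y inside fit();
# random_state makes that noise reproducible across calls.
reg = LassoLars(alpha=0.001, fit_intercept=False,
                jitter=10e-8, random_state=0)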


###############################################################################
@@ -1710,7 +1739,8 @@ class LassoLarsIC(LassoLars):
"""
def __init__(self, criterion='aic', fit_intercept=True, verbose=False,
normalize=True, precompute='auto', max_iter=500,
-eps=np.finfo(np.float).eps, copy_X=True, positive=False):
+eps=np.finfo(np.float).eps, copy_X=True, positive=False,
+random_state=None):
Review comment (Member):
why adding a random_state param here and not jitter?

self.criterion = criterion
self.fit_intercept = fit_intercept
self.positive = positive
@@ -1721,6 +1751,7 @@ def __init__(self, criterion='aic', fit_intercept=True, verbose=False,
self.precompute = precompute
self.eps = eps
self.fit_path = True
self.random_state = random_state

def _more_tags(self):
return {'multioutput': False}
33 changes: 33 additions & 0 deletions sklearn/linear_model/tests/test_least_angle.py
@@ -733,6 +733,39 @@ def test_lasso_lars_fit_copyX_behaviour(copy_X):
assert copy_X == np.array_equal(X, X_copy)


@pytest.mark.parametrize('y_list, expected_y', [
([-2.5, -2.5], [0, 2.5, 0, 2.5, 0]),
([[-2.5, -2.5], [-2.5, -2.5]],
[[0, 5, 0, 2.5, 0], [0, 5, 0, 2.5, 0]])])
def test_lars_with_jitter(y_list, expected_y):
"""
Test that user input of a small amount of jitter,
using example provided in issue #2746

"""

X = np.array([[0.0, 0.0, 0.0, -1.0, 0.0], [0.0, -1.0, 0.0, 0.0, 0.0]])
y = np.array(y_list)
expected_output = np.array(expected_y)
alpha = 0.001
fit_intercept = False
Review comment (Member):
why forcing fit_intercept = False?

Reply (Contributor, author):
This is at the edge of my stats/linear algebra understanding, but I think we need to force it to be False, since the error only occurs for exactly aligned values (e.g. this comment).

Reply (Member):
From your comment I understand that the test would not be a non-regression test with fit_intercept=True, as you only see an error with fit_intercept=False. However, the X and y you chose below do work with jitter=None too. Did you check that the test still passes with fit_intercept=True?

Reply (Member):
Since the target is constant (-2.5, -2.5), fitting with the intercept would mean the coeffs are just all 0 (and the intercept is -2.5).

So I guess it makes sense to leave fit_intercept=False. It properly reproduces the original example from the issue.
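To make that concrete, a quick sketch (stock LassoLars, no jitter involved) showing the intercept absorbing the constant target:

import numpy as np
from sklearn.linear_model import LassoLars

X = np.array([[0.0, 0.0, 0.0, -1.0, 0.0],
              [0.0, -1.0, 0.0, 0.0, 0.0]])
y = np.array([-2.5, -2.5])  # constant target

reg = LassoLars(alpha=0.001, fit_intercept=True).fit(X, y)
print(reg.coef_)       # all zeros: centering removes the constant target
print(reg.intercept_)  # -2.5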


lars = linear_model.LassoLars(alpha=alpha, fit_intercept=fit_intercept)
lars_with_jitter = linear_model.LassoLars(alpha=alpha,
fit_intercept=fit_intercept,
jitter=10e-8,
random_state=0)

lars.fit(X, y)
lars_with_jitter.fit(X, y)

w_nojitter = lars.coef_
w_jitter = lars_with_jitter.coef_

assert not np.array_equal(w_jitter, w_nojitter)
Review comment (Member):
This is too easy to pass, so maybe instead check the mean squared difference (MSD):

assert np.mean((w_jitter - w_nojitter)**2) > .1

assert_array_almost_equal(w_jitter, expected_output, decimal=2)
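For completeness, a sketch of running just the new test via pytest's Python entry point (the path is the test file shown above; -k filters by test name):

import pytest

pytest.main(["sklearn/linear_model/tests/test_least_angle.py",
             "-k", "test_lars_with_jitter"])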


def test_X_none_gram_not_none():
with pytest.raises(ValueError,
match="X cannot be None if Gram is not None"):
Expand Down