DOC Pilot of annotating parameters with category #17929

Open · wants to merge 3 commits into main
5 changes: 4 additions & 1 deletion doc/conf.py
@@ -59,6 +59,10 @@
mathjax_path = ('https://cdn.jsdelivr.net/npm/mathjax@3/es5/'
'tex-chtml.js')

rst_prolog = r"""
.. include:: /includes/prolog.rst
"""

autodoc_default_options = {
'members': True,
'inherited-members': True
@@ -438,7 +442,6 @@ def generate_min_dependency_table(app):
# we use the issues path for PRs since the issues URL will forward
issues_github_path = 'scikit-learn/scikit-learn'


def setup(app):
app.connect('builder-inited', generate_min_dependency_table)
# to hide/show the prompt in code examples:
18 changes: 18 additions & 0 deletions doc/glossary.rst
@@ -198,6 +198,11 @@ General Concepts
exceptional behaviours on the estimator using semantic :term:`estimator
tags`.

control parameter
A :term:`parameter` that configures the logic of an estimator or
function, and should ordinarily be determined by the task rather
than be subject to :term:`tuning <tuning parameter>`.

deprecation
We use deprecation to slowly violate our :term:`backwards
compatibility` assurances, usually to:
@@ -601,6 +606,9 @@ General Concepts
called.

Common parameters are listed :ref:`below <glossary_parameters>`.
Parameters in the API Reference may be labelled as one of:
:term:`control parameter`, :term:`tuning parameter`, or
:term:`resources parameter`.

pairwise metric
pairwise metrics
@@ -653,6 +661,10 @@ General Concepts
vectors, etc. The purpose of a :term:`vectorizer` is to produce
rectangular forms of such data.

resources parameter
A :term:`parameter` that does not affect the result of modelling, but
may help with resource utilization or tracking.

sample
samples
We usually use this term as a noun to indicate a single feature vector.
@@ -765,6 +777,12 @@ General Concepts
:class:`cluster.AgglomerativeClustering` and
:class:`neighbors.LocalOutlierFactor`.

tuning parameter
A :term:`parameter` that may need to be tuned (such as with :ref:`model
selection tools <grid_search>`) for the estimator to produce its best
model, but which does not affect the class or logic of the model as
a :term:`control parameter` might.

unlabeled
unlabeled data
Samples with an unknown ground truth when fitting; equivalently,
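
Taken together, the three categories are easiest to see side by side. A minimal sketch using scikit-learn's existing API (an illustration, not part of this diff): control parameters are fixed by the task, tuning parameters are searched over, and resources parameters change runtime but not results.

```python
from sklearn.datasets import make_classification
from sklearn.linear_model import LogisticRegression
from sklearn.model_selection import GridSearchCV

X, y = make_classification(random_state=0)

# Control parameters (penalty, fit_intercept) are determined by the
# task; resources parameters (n_jobs) affect runtime, not the result.
base = LogisticRegression(penalty="l2", fit_intercept=True, n_jobs=None)

# Tuning parameters (C) are what model selection tools search over.
search = GridSearchCV(base, param_grid={"C": [0.01, 0.1, 1.0, 10.0]})
search.fit(X, y)
print(search.best_params_)
```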
9 changes: 9 additions & 0 deletions doc/includes/prolog.rst
@@ -0,0 +1,9 @@
.. role:: raw-html(raw)
:format: html

.. role:: raw-latex(raw)
:format: latex

.. |ControlParameter| replace:: :raw-html:`<a class="paramtype" href="../../glossary.html#term-control-parameter" title="Glossary on Control Parameter"><span class="badge badge-primary">Control</span></a>` :raw-latex:`{\small\sc [Control Parameter]}`
.. |TuningParameter| replace:: :raw-html:`<a class="paramtype" href="../../glossary.html#term-tuning-parameter" title="Glossary on Tuning Parameter"><span class="badge badge-warning">Tuning</span></a>` :raw-latex:`{\small\sc [Tuning Parameter]}`
.. |ResourcesParameter| replace:: :raw-html:`<a class="paramtype" href="../../glossary.html#term-resources-parameter" title="Glossary on Resources Parameter"><span class="badge badge-secondary">Resources</span></a>` :raw-latex:`{\small\sc [Resources Parameter]}`
8 changes: 1 addition & 7 deletions doc/whats_new/_contributors.rst
@@ -6,12 +6,6 @@
hyperlink all contributors' names, and ``:user:`` should now be preferred.
It also defines other ReST substitutions.

.. role:: raw-html(raw)
:format: html

.. role:: raw-latex(raw)
:format: latex

.. |MajorFeature| replace:: :raw-html:`<span class="badge badge-success">Major Feature</span>` :raw-latex:`{\small\sc [Major Feature]}`
.. |Feature| replace:: :raw-html:`<span class="badge badge-success">Feature</span>` :raw-latex:`{\small\sc [Feature]}`
.. |Efficiency| replace:: :raw-html:`<span class="badge badge-info">Efficiency</span>` :raw-latex:`{\small\sc [Efficiency]}`
@@ -176,4 +170,4 @@

.. _Nicolas Hug: https://github.com/NicolasHug

.. _Guillaume Lemaitre: https://github.com/glemaitre
30 changes: 30 additions & 0 deletions sklearn/linear_model/_logistic.py
@@ -1043,6 +1043,8 @@ class LogisticRegression(LinearClassifierMixin,
only supported by the 'saga' solver. If 'none' (not supported by the
liblinear solver), no regularization is applied.

|ControlParameter|
Contributor:

Hm, I would say this is an (even traditional) example of a tuning parameter?

Member Author:

Hmm... I suppose you're right.

I suspect that I over-generated control parameters.


.. versionadded:: 0.19
l1 penalty with SAGA solver (allowing 'multinomial' + L1)

@@ -1051,18 +1053,26 @@ class LogisticRegression(LinearClassifierMixin,
l2 penalty with liblinear solver. Prefer dual=False when
n_samples > n_features.

|TuningParameter|

tol : float, default=1e-4
Tolerance for stopping criteria.

|TuningParameter|

C : float, default=1.0
Inverse of regularization strength; must be a positive float.
Like in support vector machines, smaller values specify stronger
regularization.

|TuningParameter|

fit_intercept : bool, default=True
Specifies if a constant (a.k.a. bias or intercept) should be
added to the decision function.

|ControlParameter|
Contributor:

This as well. It does not influence the shape of the output, for example.

Member Author:

And what of class_weight?

Contributor (@mitar, Jul 18, 2020):

I would say that one is hard to tune; I have not heard of anyone tuning it with exact values for the classes. But for "balanced" vs. None, I think you could try your pipeline with both and see which is best, no? So tune?

So in a way, in my mental model, I see tuning as "can I fiddle with this value without having to change the rest of the pipeline?" :-) (There are some dependencies between parameters, though, which I might have to fix as a consequence.)
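
A minimal sketch of that kind of coarse tuning, using GridSearchCV (an illustration, not part of this diff):

```python
from sklearn.datasets import make_classification
from sklearn.linear_model import LogisticRegression
from sklearn.model_selection import GridSearchCV

# An imbalanced toy problem where class weighting matters.
X, y = make_classification(weights=[0.9, 0.1], random_state=0)

# Tune class_weight over its coarse settings (None vs. 'balanced')
# rather than hand-picking exact per-class weights.
search = GridSearchCV(
    LogisticRegression(max_iter=1000),
    param_grid={"class_weight": [None, "balanced"]},
    scoring="f1",
)
search.fit(X, y)
print(search.best_params_)
```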


intercept_scaling : float, default=1
Useful only when the solver 'liblinear' is used
and self.fit_intercept is set to True. In this case, x becomes
@@ -1076,6 +1086,8 @@ class LogisticRegression(LinearClassifierMixin,
To lessen the effect of regularization on synthetic feature weight
(and therefore on the intercept) intercept_scaling has to be increased.

|TuningParameter|

class_weight : dict or 'balanced', default=None
Weights associated with classes in the form ``{class_label: weight}``.
If not given, all classes are supposed to have weight one.
@@ -1087,13 +1099,17 @@ class LogisticRegression(LinearClassifierMixin,
Note that these weights will be multiplied with sample_weight (passed
through the fit method) if sample_weight is specified.

|ControlParameter|

.. versionadded:: 0.17
*class_weight='balanced'*

random_state : int, RandomState instance, default=None
Used when ``solver`` == 'sag', 'saga' or 'liblinear' to shuffle the
data. See :term:`Glossary <random_state>` for details.

|ControlParameter|
Contributor:

This is one of those which might be better served by a completely custom parameter type, like RandomSourceParameter or something.

Member:

RandomSourceParameter also illustrates the limits of such an approach: I have no idea what this means.

If we try to be too precise, we will make it tedious to contribute, and will not reach any users as they won't understand.

Member:

Maybe random_state should just not have any label?
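
For what it's worth, a small sketch (an illustration, not part of this diff) of why random_state sits awkwardly in these categories: with a stochastic solver it can change the fitted coefficients, so it is not purely a resources parameter, yet nobody tunes it either.

```python
from sklearn.datasets import make_classification
from sklearn.linear_model import LogisticRegression

X, y = make_classification(random_state=0)

# Two seeds, same data: 'saga' shuffles the data, so the solver may
# converge to slightly different coefficients.
a = LogisticRegression(solver="saga", random_state=0).fit(X, y)
b = LogisticRegression(solver="saga", random_state=1).fit(X, y)
print(abs(a.coef_ - b.coef_).max())  # small, but possibly nonzero
```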


solver : {'newton-cg', 'lbfgs', 'liblinear', 'sag', 'saga'}, \
default='lbfgs'

@@ -1113,6 +1129,8 @@ class LogisticRegression(LinearClassifierMixin,
features with approximately the same scale. You can
preprocess the data with a scaler from sklearn.preprocessing.

|TuningParameter|

.. versionadded:: 0.17
Stochastic Average Gradient descent solver.
.. versionadded:: 0.19
@@ -1123,6 +1141,8 @@ class LogisticRegression(LinearClassifierMixin,
max_iter : int, default=100
Maximum number of iterations taken for the solvers to converge.

|TuningParameter|

multi_class : {'auto', 'ovr', 'multinomial'}, default='auto'
If the option chosen is 'ovr', then a binary problem is fit for each
label. For 'multinomial' the loss minimised is the multinomial loss fit
@@ -1131,6 +1151,8 @@ class LogisticRegression(LinearClassifierMixin,
'auto' selects 'ovr' if the data is binary, or if solver='liblinear',
and otherwise selects 'multinomial'.

|ControlParameter|

.. versionadded:: 0.18
Stochastic Average Gradient descent solver for 'multinomial' case.
.. versionchanged:: 0.22
@@ -1140,11 +1162,15 @@ class LogisticRegression(LinearClassifierMixin,
For the liblinear and lbfgs solvers set verbose to any positive
number for verbosity.

|ResourcesParameter|
Contributor:

I think sklearn might also need a DebugParameter type. (We do not have those in D3M.)


warm_start : bool, default=False
When set to True, reuse the solution of the previous call to fit as
initialization, otherwise, just erase the previous solution.
Useless for liblinear solver. See :term:`the Glossary <warm_start>`.

|ResourcesParameter|
Contributor:

I think this should be double-tagged as control as well, since it drastically changes the behavior of the estimator if you call it multiple times.
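
A sketch of the behavior change being described (an illustration, not part of this diff): with warm_start=True, a second call to fit starts from the previous solution instead of re-initializing.

```python
from sklearn.datasets import make_classification
from sklearn.linear_model import LogisticRegression

X, y = make_classification(n_samples=500, random_state=0)

# Deliberately under-iterate so a single fit does not fully converge.
clf = LogisticRegression(warm_start=True, max_iter=5)
clf.fit(X, y)                  # first call: starts from scratch
coef_first = clf.coef_.copy()
clf.fit(X, y)                  # second call: continues from coef_first
print((clf.coef_ != coef_first).any())  # True: the solution kept moving
```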


.. versionadded:: 0.17
*warm_start* to support *lbfgs*, *newton-cg*, *sag*, *saga* solvers.

@@ -1156,13 +1182,17 @@ class LogisticRegression(LinearClassifierMixin,
context. ``-1`` means using all processors.
See :term:`Glossary <n_jobs>` for more details.

|ResourcesParameter|

l1_ratio : float, default=None
The Elastic-Net mixing parameter, with ``0 <= l1_ratio <= 1``. Only
used if ``penalty='elasticnet'``. Setting ``l1_ratio=0`` is equivalent
to using ``penalty='l2'``, while setting ``l1_ratio=1`` is equivalent
to using ``penalty='l1'``. For ``0 < l1_ratio <1``, the penalty is a
combination of L1 and L2.

|TuningParameter|

Attributes
----------
