sdpython · sdpython · Jul 19, 2022 · Jul 19, 2022
diff --git a/_doc/examples/plot_constraint_kmeans.py b/_doc/examples/plot_constraint_kmeans.py
@@ -57,7 +57,7 @@
     x = [km.cluster_centers_[i, 0], km.cluster_centers_[i, 0]]
     y = [km.cluster_centers_[i, 1], km.cluster_centers_[i, 1]]
     ax.plot(x, y, colors[i] + '+')
-ax.set_title('KMeans 4 clusters\n%r' % hist)
+ax.set_title(f'KMeans 4 clusters\n{hist!r}')
 ax.legend()
 
 #####################################
@@ -94,9 +94,9 @@
     x = [km2.cluster_centers_[i, 0], km2.cluster_centers_[i, 0]]
     y = [km2.cluster_centers_[i, 1], km2.cluster_centers_[i, 1]]
     ax[1].plot(x, y, colors[i] + '+')
-ax[0].set_title('ConstraintKMeans 4 clusters (gains)\n%r' % hist1)
+ax[0].set_title(f'ConstraintKMeans 4 clusters (gains)\n{hist1!r}')
 ax[0].legend()
-ax[1].set_title('ConstraintKMeans 4 clusters (distances)\n%r' % hist2)
+ax[1].set_title(f'ConstraintKMeans 4 clusters (distances)\n{hist2!r}')
 ax[1].legend()
 
 
@@ -129,7 +129,7 @@ def plot_delaunay(ax, edges, points):
     x = [km.cluster_centers_[i, 0], km.cluster_centers_[i, 0]]
     y = [km.cluster_centers_[i, 1], km.cluster_centers_[i, 1]]
     ax[0].plot(x, y, colors[i] + '+')
-ax[0].set_title("ConstraintKMeans 4 clusters\nstrategy='weights'\n%r" % hist)
+ax[0].set_title(f"ConstraintKMeans 4 clusters\nstrategy='weights'\n{hist!r}")
 ax[0].legend()
 
 cls = km.cluster_centers_iter_

diff --git a/_unittests/ut_documentation/test_nb_search_keras.py b/_unittests/ut_documentation/test_nb_search_keras.py
@@ -31,8 +31,7 @@ def test_notebook_search_images(self):
             except (SyntaxError, ModuleNotFoundError, AttributeError,
                     ImportError) as e:
                 warnings.warn(
-                    "tensorflow is probably not available yet on python 3.7: "
-                    "{0}".format(e))
+                    f"tensorflow is probably not available yet on python 3.7: {e}")
                 return
 
         self.assertTrue(mlinsights is not None)

diff --git a/_unittests/ut_plotting/test_plot_gallery.py b/_unittests/ut_plotting/test_plot_gallery.py
@@ -57,7 +57,7 @@ def test_plot_gallery_url(self):
         try:
             fig, ax = plot_gallery_images(files, return_figure=True)
         except http.client.RemoteDisconnected as e:
-            warnings.warn("Unable to fetch image {0}'".format(e))
+            warnings.warn(f"Unable to fetch image {e}")
             return
         img = os.path.join(temp, "gallery.png")
         fig.savefig(img)
@@ -68,7 +68,7 @@ def test_plot_gallery_url(self):
             ax = plot_gallery_images(files, return_figure=False, ax=ax)
             self.assertNotEmpty(ax)
         except http.client.RemoteDisconnected as e:
-            warnings.warn("Unable to fetch image {0}'".format(e))
+            warnings.warn(f"Unable to fetch image {e}")
             return
 
 

diff --git a/_unittests/ut_search_rank/test_LONG_search_images_keras.py b/_unittests/ut_search_rank/test_LONG_search_images_keras.py
@@ -31,7 +31,7 @@ def test_search_predictions_keras(self):
             except (SyntaxError, ModuleNotFoundError, AttributeError,
                     ImportError) as e:
                 warnings.warn(
-                    "Issue with tensorflow or keras: {0}".format(e))
+                    f"Issue with tensorflow or keras: {e}")
                 return
             from keras.preprocessing.image import ImageDataGenerator  # pylint: disable=E0401,E0611
             from keras.preprocessing.image import img_to_array, load_img  # pylint: disable=E0401,E0611

diff --git a/_unittests/ut_search_rank/test_LONG_search_images_torch.py b/_unittests/ut_search_rank/test_LONG_search_images_torch.py
@@ -32,7 +32,7 @@ def test_search_predictions_torch(self):
                 import torchvision.models as tmodels  # pylint: disable=E0401,C0415
             except (SyntaxError, ModuleNotFoundError) as e:
                 warnings.warn(
-                    "torch is not available: {0}".format(e))
+                    f"torch is not available: {e}")
                 return
             from torchvision import datasets, transforms  # pylint: disable=E0401
             from torch.utils.data import DataLoader  # pylint: disable=E0401

diff --git a/mlinsights/helpers/parameters.py b/mlinsights/helpers/parameters.py
@@ -13,7 +13,7 @@ def format_value(v):
     @return                 a string
     """
     return ("'{0}'".format(v.replace("'", "\\'"))
-            if isinstance(v, str) else "{0}".format(v))
+            if isinstance(v, str) else f"{v}")
 
 
 def format_parameters(pdict):
@@ -33,7 +33,7 @@ def format_parameters(pdict):
     """
     res = []
     for k, v in sorted(pdict.items()):
-        res.append('{0}={1}'.format(k, format_value(v)))
+        res.append(f'{k}={format_value(v)}')
     return ", ".join(res)
 
 
@@ -52,5 +52,5 @@ def format_function_call(name, pdict):
         d = dict(i=2, x=6.7, s="r")
         print(format_function_call("fct", d))
     """
-    res = '{0}({1})'.format(name, format_parameters(pdict))
+    res = f'{name}({format_parameters(pdict)})'
     return "\n".join(textwrap.wrap(res, width=70, subsequent_indent='    '))
diff --git a/mlinsights/helpers/pipeline.py b/mlinsights/helpers/pipeline.py
@@ -71,7 +71,7 @@ class PassThrough:
             pass
         else:
             raise TypeError(  # pragma: no cover
-                "pipe is not a scikit-learn object: {}\n{}".format(type(pipe), pipe))
+                f"pipe is not a scikit-learn object: {type(pipe)}\n{pipe}")
 
 
 class BaseEstimatorDebugInformation:
@@ -112,8 +112,7 @@ def to_str(self, nrows=5):
         """
         Tries to produce a readable message.
         """
-        rows = ['BaseEstimatorDebugInformation({})'.format(
-            self.model.__class__.__name__)]
+        rows = [f'BaseEstimatorDebugInformation({self.model.__class__.__name__})']
         for k in sorted(self.inputs):
             if k in self.outputs:
                 rows.append('  ' + k + '(')
@@ -126,7 +125,7 @@ def to_str(self, nrows=5):
                 rows.append('  )')
             else:
                 raise KeyError(  # pragma: no cover
-                    "Unable to find output for method '{}'.".format(k))
+                    f"Unable to find output for method '{k}'.")
         return "\n".join(rows)
 
     def display(self, data, nrows):
@@ -139,9 +138,9 @@ def display(self, data, nrows):
             rows = rows[:nrows]
             rows.append('...')
         if hasattr(data, 'shape'):
-            rows.insert(0, "shape=%r type=%r" % (data.shape, type(data)))
+            rows.insert(0, f"shape={data.shape!r} type={type(data)!r}")
         else:
-            rows.insert(0, "type=%r" % type(data))  # pragma: no cover
+            rows.insert(0, f"type={type(data)!r}")  # pragma: no cover
         return "\n".join(rows)
 
 

diff --git a/mlinsights/metrics/correlations.py b/mlinsights/metrics/correlations.py
@@ -126,13 +126,13 @@ def non_linear_correlations(df, model, draws=5, minmax=False):
                 xj_test = df_test[:, j:j + 1]
                 if len(xj_test) == 0 or len(xi_test) == 0:
                     raise ValueError(  # pragma: no cover
-                        "One column is empty i={0} j={1}.".format(i, j))
+                        f"One column is empty i={i} j={j}.")
                 mod = clone(model)
                 try:
                     mod.fit(xi_train, xj_train.ravel())
                 except Exception as e:  # pragma: no cover
                     raise ValueError(
-                        "Unable to compute correlation for i={0} j={1}.".format(i, j)) from e
+                        f"Unable to compute correlation for i={i} j={j}.") from e
                 v = mod.predict(xi_test)
                 c = (1 - numpy.var(v - xj_test.ravel()))
                 co = max(c, 0) ** 0.5

diff --git a/mlinsights/mlbatch/cache_model.py b/mlinsights/mlbatch/cache_model.py
@@ -31,7 +31,7 @@ def cache(self, params, value):
         key = MLCache.as_key(params)
         if key in self.cached:
             raise KeyError(  # pragma: no cover
-                "Key {0} already exists".format(params))
+                f"Key {params} already exists")
         self.cached[key] = value
         self.count_[key] = 0
 
@@ -77,7 +77,7 @@ def as_key(params):
             elif isinstance(v, tuple):
                 if not all(map(lambda e: isinstance(e, (int, float, str)), v)):
                     raise TypeError(  # pragma: no cover
-                        "Unable to create a key with value '{0}':{1}".format(k, v))
+                        f"Unable to create a key with value '{k}':{v}")
                 return str(v)
             elif isinstance(v, numpy.ndarray):
                 # id(v) may have been better but
@@ -87,7 +87,7 @@ def as_key(params):
                 sv = ""
             else:
                 raise TypeError(  # pragma: no cover
-                    "Unable to create a key with value '{0}':{1}".format(k, v))
+                    f"Unable to create a key with value '{k}':{v}")
             els.append((k, sv))
         return str(els)
 
@@ -122,7 +122,7 @@ def create_cache(name):
         global _caches  # pylint: disable=W0603,W0602
         if name in _caches:
             raise RuntimeError(  # pragma: no cover
-                "cache '{0}' already exists.".format(name))
+                f"cache '{name}' already exists.")
 
         cache = MLCache(name)
         _caches[name] = cache

diff --git a/mlinsights/mlmodel/_kmeans_022.py b/mlinsights/mlmodel/_kmeans_022.py
@@ -45,7 +45,7 @@ def _labels_inertia_precompute_dense(norm, X, sample_weight, centers, distances)
             X=X, Y=centers, metric='manhattan')
     else:  # pragma no cover
         raise NotImplementedError(
-            "Not implemented for norm '{}'.".format(norm))
+            f"Not implemented for norm '{norm}'.")
     # cython k-means code assumes int32 inputs
     labels = labels.astype(numpy.int32, copy=False)
     if n_samples == distances.shape[0]:

diff --git a/mlinsights/mlmodel/_kmeans_constraint_.py b/mlinsights/mlmodel/_kmeans_constraint_.py
@@ -47,7 +47,7 @@ def linearize_matrix(mat, *adds):
                     res[i, k + 3] = am[a, b]
             return res
         raise NotImplementedError(  # pragma: no cover
-            "This kind of sparse matrix is not handled: {0}".format(type(mat)))
+            f"This kind of sparse matrix is not handled: {type(mat)}")
     else:
         n = mat.shape[0]
         c = mat.shape[1]
@@ -91,7 +91,7 @@ def constraint_kmeans(X, labels, sample_weight, centers, inertia,
     """
     if labels.dtype != numpy.int32:
         raise TypeError(  # pragma: no cover
-            "Labels must be an array of int not '{0}'".format(labels.dtype))
+            f"Labels must be an array of int not '{labels.dtype}'")
 
     if strategy == 'weights':
         return _constraint_kmeans_weights(
@@ -222,8 +222,7 @@ def _constraint_association(leftover, counters, labels, leftclose, distances_clo
         return _constraint_association_gain(
             leftover, counters, labels, leftclose, distances_close,
             centers, X, x_squared_norms, limit, strategy, state=state)
-    raise ValueError("Unknwon strategy '{0}'.".format(
-        strategy))  # pragma: no cover
+    raise ValueError(f"Unknown strategy '{strategy}'.")  # pragma: no cover
 
 
 def _compute_strategy_coefficient(distances, strategy, labels):
@@ -235,7 +234,7 @@ def _compute_strategy_coefficient(distances, strategy, labels):
         dist = distances[ar, labels]
         return distances - dist[:, numpy.newaxis]
     raise ValueError(  # pragma: no cover
-        "Unknwon strategy '{0}'.".format(strategy))
+        f"Unknown strategy '{strategy}'.")
 
 
 def _randomize_index(index, weights):
@@ -479,7 +478,7 @@ def loopf(h, sumi):
     neg = (counters < ave).sum()
     if neg > 0:
         raise RuntimeError(  # pragma: no cover
-            "The algorithm failed, counters={0}".format(counters))
+            f"The algorithm failed, counters={counters}")
 
     _switch_clusters(labels, distances)
     distances_close[:] = distances[numpy.arange(X.shape[0]), labels]
@@ -540,7 +539,7 @@ def _constraint_kmeans_weights(X, labels, sample_weight, centers, inertia, it,
         if len(set(labels)) != centers.shape[0]:
             if verbose and fLOG:  # pragma: no cover
                 if isinstance(verbose, int) and verbose >= 10:
-                    fLOG("CKMeans new weights: w=%r" % weights)
+                    fLOG(f"CKMeans new weights: w={weights!r}")
                 else:
                     fLOG("CKMeans new weights")
             weights[:] = 1

diff --git a/mlinsights/mlmodel/categories_to_integers.py b/mlinsights/mlmodel/categories_to_integers.py
@@ -73,7 +73,7 @@ def fit(self, X, y=None, **fit_params):
         """
         if not isinstance(X, pandas.DataFrame):
             raise TypeError(  # pragma: no cover
-                "this transformer only accept Dataframes, not {0}".format(type(X)))
+                f"this transformer only accept Dataframes, not {type(X)}")
         if self.columns:
             columns = self.columns
         else:
@@ -89,7 +89,7 @@ def fit(self, X, y=None, **fit_params):
             nb = len(distinct)
             if nb >= max_cat:
                 raise ValueError(  # pragma: no cover
-                    "Too many categories ({0}) for one column '{1}' max_cat={2}".format(nb, c, max_cat))
+                    f"Too many categories ({nb}) for one column '{c}' max_cat={max_cat}")
             self._categories[c] = dict((c, i)
                                        for i, c in enumerate(list(sorted(distinct))))
         self._schema = self._build_schema()
@@ -107,7 +107,7 @@ def _build_schema(self):
         new_vector = {}
         last = 0
         for c, v in self._categories.items():
-            sch = [(_[1], "{0}={1}".format(c, _[1]))
+            sch = [(_[1], f"{c}={_[1]}")
                    for _ in sorted((n, d) for d, n in v.items())]
             if self.remove:
                 sch = [d for d in sch if d[1] not in self.remove]
@@ -133,7 +133,7 @@ def transform(self, X, y=None, **fit_params):
         """
         if not isinstance(X, pandas.DataFrame):
             raise TypeError(  # pragma: no cover
-                "X is not a dataframe: {0}".format(type(X)))
+                f"X is not a dataframe: {type(X)}")
 
         if self.single:
             b = not self.skip_errors

diff --git a/mlinsights/mlmodel/classification_kmeans.py b/mlinsights/mlmodel/classification_kmeans.py
@@ -156,7 +156,7 @@ def set_params(self, **values):
                 pc[k[2:]] = v
             else:
                 raise ValueError(  # pragma: no cover
-                    "Unexpected parameter name '{0}'".format(k))
+                    f"Unexpected parameter name '{k}'")
         self.clus.set_params(**pc)
         self.estimator.set_params(**pe)
 
@@ -165,8 +165,8 @@ def __repr__(self):  # pylint: disable=W0222
         Overloads `repr` as *scikit-learn* now relies
         on the constructor signature.
         """
-        el = ', '.join(['%s=%r' % (k, v)
+        el = ', '.join([f'{k}={v!r}'
                         for k, v in self.get_params().items()])
-        text = "%s(%s)" % (self.__class__.__name__, el)
+        text = f"{self.__class__.__name__}({el})"
         lines = textwrap.wrap(text, subsequent_indent='    ')
         return "\n".join(lines)
diff --git a/mlinsights/mlmodel/decision_tree_logreg.py b/mlinsights/mlmodel/decision_tree_logreg.py
@@ -409,7 +409,7 @@ def fit(self, X, y, sample_weight=None):
         if self.strategy == 'perpendicular':
             return self._fit_perpendicular(X, y, sample_weight)
         raise ValueError(
-            "Unknown strategy '{}'.".format(self.strategy))
+            f"Unknown strategy '{self.strategy}'.")
 
     def _fit_parallel(self, X, y, sample_weight):
         "Implements the parallel strategy."

diff --git a/mlinsights/mlmodel/extended_features.py b/mlinsights/mlmodel/extended_features.py
@@ -60,7 +60,7 @@ def get_feature_names(self, input_features=None):
         if self.kind == 'poly-slow':
             return self._get_feature_names_poly(input_features)
         raise ValueError(  # pragma: no cover
-            "Unknown extended features '{}'.".format(self.kind))
+            f"Unknown extended features '{self.kind}'.")
 
     def _get_feature_names_poly(self, input_features=None):
         """
@@ -72,8 +72,7 @@ def _get_feature_names_poly(self, input_features=None):
                               i for i in range(0, self.n_input_features_)]
         elif len(input_features) != self.n_input_features_:
             raise ValueError(  # pragma: no cover
-                "input_features should contain {} strings.".format(
-                    self.n_input_features_))
+                f"input_features should contain {self.n_input_features_} strings.")
 
         names = ["1"] if self.poly_include_bias else []
         n = self.n_input_features_
@@ -126,7 +125,7 @@ def fit(self, X, y=None):
         elif self.kind == 'poly-slow':
             return self._fit_poly(X, y)
         raise ValueError(  # pragma: no cover
-            "Unknown extended features '{}'.".format(self.kind))
+            f"Unknown extended features '{self.kind}'.")
 
     def _fit_poly(self, X, y=None):
         """
@@ -155,7 +154,7 @@ def transform(self, X):
         if self.kind == 'poly-slow':
             return self._transform_poly_slow(X)
         raise ValueError(  # pragma: no cover
-            "Unknown extended features '{}'.".format(self.kind))
+            f"Unknown extended features '{self.kind}'.")
 
     def _transform_poly(self, X):
         """

diff --git a/mlinsights/mlmodel/kmeans_constraint.py b/mlinsights/mlmodel/kmeans_constraint.py
@@ -85,8 +85,7 @@ def __init__(self, n_clusters=8, init='k-means++', n_init=10, max_iter=500,
         self.history = history
         self.learning_rate = learning_rate
         if strategy not in ConstraintKMeans._strategy_value:
-            raise ValueError('strategy must be in {0}'.format(
-                ConstraintKMeans._strategy_value))
+            raise ValueError(f'strategy must be in {ConstraintKMeans._strategy_value}')
 
     def fit(self, X, y=None, sample_weight=None, fLOG=None):
         """