scikit-hep · HDembinski · Feb 2, 2022 · Feb 1, 2022
diff --git a/src/resample/permutation.py b/src/resample/permutation.py
@@ -360,46 +360,6 @@ def anova(
     return same_population(_ANOVA(), x, y, *args, **kwargs)
 
 
-def mannwhitneyu(x: _ArrayLike, y: _ArrayLike, **kwargs: _Kwargs) -> TestResult:
-    """
-    Test whether two samples are drawn from the same population based on ranking.
-
-    This performs the permutation-based Mann-Whitney U test, see for details. The test
-    works for any population of samples that are ordinal, so also for integers. This is
-    the two-sided version of the test, meaning that the test gives the same p-value if
-    x and y are swapped.
-
-    For normally distributed data, the test is almost as powerful as the t-test and
-    considerably more powerful for non-normal populations. The t-test tests whether two
-    samples have the same mean and ignores differences in variance, while the
-    Mann-Whitney U test also detects differences in variance.
-
-    Parameters
-    ----------
-    x : array-like
-        First sample.
-    y : array-like
-        Second sample.
-    **kwargs :
-        Keyword arguments are forward to :meth:`same_population`.
-    **kwargs :
-        Keyword arguments are forward to :meth:`same_population`.
-
-    Returns
-    -------
-    TestResult
-
-    Notes
-    -----
-    https://en.wikipedia.org/wiki/Mann%E2%80%93Whitney_U_test
-    """
-    n1 = len(x)
-    n2 = len(y)
-    mu = n1 * n2 // 2
-    kwargs["transform"] = lambda x: np.abs(x - mu)
-    return same_population(_mannwhitneyu, x, y, **kwargs)
-
-
 def kruskal(
     x: _ArrayLike, y: _ArrayLike, *args: _ArrayLike, **kwargs: _Kwargs
 ) -> TestResult:
@@ -526,16 +486,6 @@ def _ttest(x: np.ndarray, y: np.ndarray) -> float:
     return r
 
 
-def _mannwhitneyu(x: np.ndarray, y: np.ndarray) -> float:
-    # method 2 from Wikipedia, but returning U1 instead of min(U1, U2) to be
-    # consistent with scipy.stats.mannwhitneyu(x, y, alternative="two-sided")
-    n1 = len(x)
-    a = _rankdata(np.concatenate([x, y]))
-    r1 = np.sum(a[:n1])
-    u1: float = r1 - 0.5 * n1 * (n1 + 1)
-    return u1
-
-
 def _pearson(x: np.ndarray, y: np.ndarray) -> float:
     m1 = np.mean(x)
     m2 = np.mean(y)

diff --git a/tests/test_permutation.py b/tests/test_permutation.py
@@ -62,7 +62,6 @@ def __getitem__(self, key):
 
 scipy = Scipy(
     anova=stats.f_oneway,
-    mannwhitneyu=lambda x, y: stats.mannwhitneyu(x, y, alternative="two-sided"),
     ttest=lambda x, y: stats.ttest_ind(x, y, equal_var=False),
 )
 
@@ -71,7 +70,6 @@ def __getitem__(self, key):
     "test_name",
     (
         "anova",
-        "mannwhitneyu",
         "kruskal",
         "pearsonr",
         "spearmanr",
@@ -97,7 +95,6 @@ def test_two_sample_same_size(test_name, size, rng):
     "test_name",
     (
         "anova",
-        "mannwhitneyu",
         "kruskal",
         "pearsonr",
         "spearmanr",