raphaelvallat · kschuerholt · Jan 21, 2022 · Jun 20, 2022 · Jun 20, 2022 · raphaelvallat
diff --git a/pingouin/nonparametric.py b/pingouin/nonparametric.py
@@ -152,7 +152,8 @@ def madmedianrule(a):
     return (np.fabs(a - np.median(a)) / mad(a)) > k
 
 
-def mwu(x, y, alternative="two-sided", **kwargs):
+def mwu(x, y, alternative="two-sided", confidence=0.95, **kwargs):
+
     """Mann-Whitney U Test (= Wilcoxon rank-sum test). It is the non-parametric
     version of the independent T-test.
 
@@ -165,6 +166,8 @@ def mwu(x, y, alternative="two-sided", **kwargs):
         Defines the alternative hypothesis, or tail of the test. Must be one of
         "two-sided" (default), "greater" or "less". See :py:func:`scipy.stats.mannwhitneyu` for
         more details.
+    confidence : float
+        Confidence level on confidence interval of difference of medians between x and y.
     **kwargs : dict
         Additional keywords arguments that are passed to :py:func:`scipy.stats.mannwhitneyu`.
 
@@ -177,6 +180,7 @@ def mwu(x, y, alternative="two-sided", **kwargs):
         * ``'p-val'``: p-value
         * ``'RBC'``   : rank-biserial correlation
         * ``'CLES'``  : common language effect size
+        * ``'CI'``  : confidence interval of difference of medians
 
     See also
     --------
@@ -230,16 +234,20 @@ def mwu(x, y, alternative="two-sided", **kwargs):
         Association and the American Statistical Association, 25(2),
         101–132. https://doi.org/10.2307/1165329
 
+    .. [5] Campbell, M. J. & Gardner, M. J. (1988). Calculating confidence
+           intervals for some non-parametric analyses.
+           British Medical Journal Volume 226, 1988.
+
     Examples
     --------
     >>> import numpy as np
     >>> import pingouin as pg
     >>> np.random.seed(123)
     >>> x = np.random.uniform(low=0, high=1, size=20)
     >>> y = np.random.uniform(low=0.2, high=1.2, size=20)
-    >>> pg.mwu(x, y, alternative='two-sided')
-         U-val alternative    p-val    RBC    CLES
-    MWU   97.0   two-sided  0.00556  0.515  0.2425
+    >>> pg.mwu(x, y, alternative='two-sided',confidence=0.95)
+         U-val alternative    p-val    RBC    CLES     CI95%
+    MWU   97.0   two-sided  0.00556  0.515  0.2425     [-0.39290395101879694, -0.09400270319896187]
 
     Compare with SciPy
 
@@ -249,19 +257,19 @@ def mwu(x, y, alternative="two-sided", **kwargs):
 
     One-sided test
 
-    >>> pg.mwu(x, y, alternative='greater')
-         U-val alternative     p-val    RBC    CLES
-    MWU   97.0     greater  0.997442  0.515  0.2425
+    >>> pg.mwu(x, y, alternative='greater',confidence=0.95)
+         U-val alternative     p-val    RBC    CLES    CI95%
+    MWU   97.0     greater  0.997442  0.515  0.2425    [-0.3711286134873304, inf]
 
-    >>> pg.mwu(x, y, alternative='less')
-         U-val alternative    p-val    RBC    CLES
-    MWU   97.0        less  0.00278  0.515  0.7575
+    >>> pg.mwu(x, y, alternative='less',confidence=0.95)
+         U-val alternative    p-val    RBC    CLES     CI95%
+    MWU   97.0        less  0.00278  0.515  0.7575     [-inf, -0.10192641647044609]
 
     Passing keyword arguments to :py:func:`scipy.stats.mannwhitneyu`:
 
-    >>> pg.mwu(x, y, alternative='two-sided', method='exact')
-         U-val alternative     p-val    RBC    CLES
-    MWU   97.0   two-sided  0.004681  0.515  0.2425
+    >>> pg.mwu(x, y, alternative='two-sided',confidence=0.95, method='exact')
+         U-val alternative     p-val    RBC    CLES    CI95%
+    MWU   97.0   two-sided  0.004681  0.515  0.2425    [-0.39290395101879694, -0.09400270319896187]
     """
     x = np.asarray(x)
     y = np.asarray(y)
@@ -294,6 +302,24 @@ def mwu(x, y, alternative="two-sided", **kwargs):
     # Effect size 2: rank biserial correlation (Wendt 1972)
     rbc = 1 - (2 * uval) / diff.size  # diff.size = x.size * y.size
 
+    # Confidence interval for the (difference in) medians
+    # Campbell and Gardner 2000
+    if alternative == "two-sided":
+        alpha = 1.0 - confidence
+        conf = 1.0 - alpha / 2  # 0.975
+    else:
+        conf = confidence
+    N = scipy.stats.norm.ppf(conf)
+    ct1, ct2 = len(x), len(y)  # count samples
+    diffs = sorted([i - j for i in x for j in y])  # get ct1xct2 difference
+    k = int(round(ct1 * ct2 / 2 - (N * (ct1 * ct2 * (ct1 + ct2 + 1) / 12) ** 0.5)))
+    ci = [diffs[k], diffs[len(diffs) - k]]
+    if alternative == "greater":
+        ci[1] = np.inf
+    elif alternative == "less":
+        ci[0] = -np.inf
+    # Rename CI
+    ci_name = "CI%.0f%%" % (100 * confidence)
     # Fill output DataFrame
     stats = pd.DataFrame(
         {"U-val": uval, "alternative": alternative, "p-val": pval, "RBC": rbc, "CLES": cles},