matplotlib · ghost · May 7, 2017 · May 7, 2017 · May 7, 2017 · May 7, 2017
diff --git a/lib/matplotlib/axes/_axes.py b/lib/matplotlib/axes/_axes.py
@@ -88,6 +88,26 @@ def _plot_args_replacer(args, data):
                          "multiple plotting calls instead.")
 
 
+class ViolinStatFunc(object):
+    """
+    Description of one custom summary statistic for a violin plot.
+
+    A :class:`ViolinStatFunc` bundles:
+
+    1) a callable that computes the statistic. Its first positional argument
+       is the 1-d data of one violin; that argument is supplied when the
+       statistic is computed and must not be listed in *args*.
+    2) an alias for this callable. When violinplot outputs the dictionary of
+       artists, this alias (prefixed with ``custom_``) is the key of the
+       artist object corresponding to this callable.
+    3) a list of additional positional arguments that are passed to the
+       callable after the data.
+
+    Parameters
+    ----------
+    func_callable : callable
+        The function computing the statistic.
+    alias : str, optional
+        Defaults to ``func_callable.__name__``, or to the name of the
+        callable's type when the callable has no ``__name__``.
+    args : list, optional
+        Extra positional arguments. Defaults to an empty list.
+
+    Raises
+    ------
+    ValueError
+        If *func_callable* is not callable or *args* is not a list.
+    TypeError
+        If a keyword argument other than *alias* or *args* is given.
+    """
+    def __init__(self, func_callable, **kargs):
+        if not callable(func_callable):
+            raise ValueError('func_callable has to be a callable')
+        self.func_callable = func_callable
+
+        alias = kargs.pop('alias', None)
+        if alias is None:
+            # Resolve the name only when it is needed: callables such as
+            # functools.partial objects or instances that define __call__
+            # have no __name__ attribute.
+            alias = getattr(func_callable, '__name__',
+                            type(func_callable).__name__)
+        self.alias = alias
+
+        self.optional_args = kargs.pop('args', [])
+        if not isinstance(self.optional_args, list):
+            raise ValueError('args has to be a list')
+
+        if kargs:
+            # Reject typos such as ``alais=...`` instead of ignoring them.
+            raise TypeError('unexpected keyword argument(s): {}'.format(
+                ', '.join(sorted(kargs))))
+
+
 # The axes module contains all the wrappers to plotting functions.
 # All the other methods should go in the _AxesBase class.
 
@@ -7277,7 +7297,7 @@ def matshow(self, Z, **kwargs):
     @_preprocess_data(replace_names=["dataset"], label_namer=None)
     def violinplot(self, dataset, positions=None, vert=True, widths=0.5,
                    showmeans=False, showextrema=True, showmedians=False,
-                   points=100, bw_method=None):
+                   points=100, bw_method=None, statistics_function_list=[]):
         """
         Make a violin plot.
 
@@ -7324,6 +7344,13 @@ def violinplot(self, dataset, positions=None, vert=True, widths=0.5,
           callable, it should take a `GaussianKDE` instance as its only
           parameter and return a scalar. If None (default), 'scott' is used.
 
+        statistics_function_list : list of callable or ViolinStatFunc
+          Custom summary statistics to be displayed on the violin plot.
+          The only constraint is that the first argument of each
+          function must be the input data of the violin plot, i.e.
+          `dataset` if `dataset` is 1-d, or an element of `dataset` if
+          `dataset` is 2-d.
+
         Returns
         -------
 
@@ -7369,12 +7396,44 @@ def _kde_method(X, coords):
             kde = mlab.GaussianKDE(X, bw_method)
             return kde.evaluate(coords)
 
-        vpstats = cbook.violin_stats(dataset, _kde_method, points=points)
-        return self.violin(vpstats, positions=positions, vert=vert,
+        def _resolve_duplicate_alias(func_obj_list):
+            """
+            Make the ``alias`` of every object in *func_obj_list* unique.
+
+            The list is walked in order; an alias that was already taken
+            by an earlier entry gets ``'x'`` appended until it is free.
+            The objects are modified in place and nothing is returned.
+            """
+            taken = set()
+            for entry in func_obj_list:
+                candidate = entry.alias
+                # Keep extending the name until it no longer collides.
+                while candidate in taken:
+                    candidate += 'x'
+                entry.alias = candidate
+                taken.add(candidate)
+
+        violin_stat_func_obj_list = []
+        for func in statistics_function_list:
+            if not isinstance(func, ViolinStatFunc):
+                if callable(func):
+                    violin_stat_func_obj_list.append(ViolinStatFunc(func))
+                else:
+                    raise ValueError(
+                        'Optional argument has to be a callable' +
+                        'or a ViolinStatFunc object')
+            else:
+                violin_stat_func_obj_list.append(func)
+
+        custom_stat_alias_list = [func_obj.alias for func_obj in
+                                  violin_stat_func_obj_list]
+        if len(custom_stat_alias_list) > len(set(custom_stat_alias_list)):
+            _resolve_duplicate_alias(violin_stat_func_obj_list)
+            # remake alias list based on updated unique aliases
+            custom_stat_alias_list = [func_obj.alias for func_obj in
+                                      violin_stat_func_obj_list]
+
+        vpstats, custom_stat_vals = \
+            cbook.violin_stats(dataset, _kde_method,
+                               violin_stat_func_obj_list, points=points)
+
+        return self.violin(vpstats, custom_stat_vals, custom_stat_alias_list,
+                           positions=positions, vert=vert,
                            widths=widths, showmeans=showmeans,
                            showextrema=showextrema, showmedians=showmedians)
 
-    def violin(self, vpstats, positions=None, vert=True, widths=0.5,
+    def violin(self, vpstats, custom_stat_vals, custom_stat_alias_list,
+               positions=None, vert=True, widths=0.5,
                showmeans=False, showextrema=True, showmedians=False):
         """Drawing function for violin plots.
 
@@ -7511,7 +7570,9 @@ def violin(self, vpstats, positions=None, vert=True, widths=0.5,
 
         # Render violins
         bodies = []
-        for stats, pos, width in zip(vpstats, positions, widths):
+        custom_vals = {}
+        for stats, pos, width, stat_val_dict in zip(vpstats, positions,
+                                                    widths, custom_stat_vals):
             # The 0.5 factor reflects the fact that we plot from v-p to
             # v+p
             vals = np.array(stats['vals'])
@@ -7525,6 +7586,11 @@ def violin(self, vpstats, positions=None, vert=True, widths=0.5,
             mins.append(stats['min'])
             maxes.append(stats['max'])
             medians.append(stats['median'])
+            for alias in custom_stat_alias_list:
+                if alias not in custom_vals:
+                    custom_vals[alias] = []
+                custom_vals[alias].append(stat_val_dict[alias])
+
         artists['bodies'] = bodies
 
         # Render means
@@ -7547,6 +7613,12 @@ def violin(self, vpstats, positions=None, vert=True, widths=0.5,
                                              pmins,
                                              pmaxes,
                                              colors=edgecolor)
+        # Render custom statistics
+        for alias in custom_stat_alias_list:
+            artists['custom_' + alias] = perp_lines(custom_vals[alias],
+                                                    pmins,
+                                                    pmaxes,
+                                                    colors=edgecolor)
 
         return artists
 

diff --git a/lib/matplotlib/cbook/__init__.py b/lib/matplotlib/cbook/__init__.py
@@ -2001,13 +2001,13 @@ def _reshape_2D(X, name):
         raise ValueError("{} must have 2 or fewer dimensions".format(name))
 
 
-def violin_stats(X, method, points=100):
+def violin_stats(X, method, custom_stat_func_obj, points=100):
     """
     Returns a list of dictionaries of data which can be used to draw a series
     of violin plots. See the `Returns` section below to view the required keys
-    of the dictionary. Users can skip this function and pass a user-defined set
-    of dictionaries to the `axes.vplot` method instead of using MPL to do the
-    calculations.
+    of the dictionary. Users can skip this function and pass a user-defined
+    set of dictionaries to the `axes.vplot` method instead of using MPL to do
+    the calculations.
 
     Parameters
     ----------
@@ -2021,35 +2021,41 @@ def violin_stats(X, method, points=100):
         return a vector of the values of the KDE evaluated at the values
         specified in coords.
 
+    custom_stat_func_obj : list of ViolinStatFunc
+        Each object holds one custom statistic to be drawn on the violin plot.
+
     points : scalar, default = 100
-        Defines the number of points to evaluate each of the gaussian kernel
-        density estimates at.
+        Defines the number of points to evaluate each of the gaussian kernel
+        density estimates at.
 
     Returns
     -------
 
-    A list of dictionaries containing the results for each column of data.
-    The dictionaries contain at least the following:
+    Two lists of dictionaries containing the results for each column of data.
+    The first list of dictionaries contains at least the following:
 
-        - coords: A list of scalars containing the coordinates this particular
-          kernel density estimate was evaluated at.
-        - vals: A list of scalars containing the values of the kernel density
-          estimate at each of the coordinates given in `coords`.
-        - mean: The mean value for this column of data.
-        - median: The median value for this column of data.
-        - min: The minimum value for this column of data.
-        - max: The maximum value for this column of data.
+    - coords: A list of scalars containing the coordinates this particular
+      kernel density estimate was evaluated at.
+    - vals: A list of scalars containing the values of the kernel density
+      estimate at each of the coordinates given in `coords`.
+    - mean: The mean value for this column of data.
+    - median: The median value for this column of data.
+    - min: The minimum value for this column of data.
+    - max: The maximum value for this column of data.
+
+    The second list of dictionaries contains, for each column of data, the
+    result of each custom statistics function, keyed by the function's alias.
     """
-
     # List of dictionaries describing each of the violins.
     vpstats = []
+    custom_stat_vals = []
 
     # Want X to be a list of data sequences
     X = _reshape_2D(X, "X")
 
     for x in X:
         # Dictionary of results for this distribution
         stats = {}
+        stats2 = {}
 
         # Calculate basic stats for the distribution
         min_val = np.min(x)
@@ -2065,11 +2071,15 @@ def violin_stats(X, method, points=100):
         stats['median'] = np.median(x)
         stats['min'] = min_val
         stats['max'] = max_val
+        for func_obj in custom_stat_func_obj:
+            stats2[func_obj.alias] = \
+                func_obj.func_callable(x, *func_obj.optional_args)
 
         # Append to output
         vpstats.append(stats)
+        custom_stat_vals.append(stats2)
 
-    return vpstats
+    return vpstats, custom_stat_vals
 
 
 class _NestedClassGetter(object):

diff --git a/...lotlib/tests/baseline_images/test_axes/violinplot_horiz_show95_5percentiles.png b/...lotlib/tests/baseline_images/test_axes/violinplot_horiz_show95_5percentiles.png
diff --git a/lib/matplotlib/tests/baseline_images/test_axes/violinplot_horiz_showstdev.png b/lib/matplotlib/tests/baseline_images/test_axes/violinplot_horiz_showstdev.png
diff --git a/...lotlib/tests/baseline_images/test_axes/violinplot_vert_show80_20percentiles.png b/...lotlib/tests/baseline_images/test_axes/violinplot_vert_show80_20percentiles.png
diff --git a/lib/matplotlib/tests/baseline_images/test_axes/violinplot_vert_showstdev.png b/lib/matplotlib/tests/baseline_images/test_axes/violinplot_vert_showstdev.png
diff --git a/lib/matplotlib/tests/test_axes.py b/lib/matplotlib/tests/test_axes.py
@@ -2329,7 +2329,8 @@ def test_vert_violinplot_baseline():
                   showmedians=0, data=data)
 
 
-@image_comparison(baseline_images=['violinplot_vert_showmeans'],
+@image_comparison(baseline_images=['violinplot_vert_showmeans',
+                                   'violinplot_vert_showmeans'],
                   extensions=['png'])
 def test_vert_violinplot_showmeans():
     ax = plt.axes()
@@ -2338,6 +2339,11 @@ def test_vert_violinplot_showmeans():
     data = [np.random.normal(size=100) for i in range(4)]
     ax.violinplot(data, positions=range(4), showmeans=1, showextrema=0,
                   showmedians=0)
+    fig, ax = plt.subplots()
+    ax = plt.axes()
+    ax.violinplot(data, statistics_function_list=[np.mean],
+                  positions=range(4), showmeans=0, showextrema=0,
+                  showmedians=0)
 
 
 @image_comparison(baseline_images=['violinplot_vert_showextrema'],
@@ -2351,7 +2357,8 @@ def test_vert_violinplot_showextrema():
                   showmedians=0)
 
 
-@image_comparison(baseline_images=['violinplot_vert_showmedians'],
+@image_comparison(baseline_images=['violinplot_vert_showmedians',
+                                   'violinplot_vert_showmedians'],
                   extensions=['png'])
 def test_vert_violinplot_showmedians():
     ax = plt.axes()
@@ -2360,6 +2367,11 @@ def test_vert_violinplot_showmedians():
     data = [np.random.normal(size=100) for i in range(4)]
     ax.violinplot(data, positions=range(4), showmeans=0, showextrema=0,
                   showmedians=1)
+    fig, ax = plt.subplots()
+    ax = plt.axes()
+    ax.violinplot(data, statistics_function_list=[np.median],
+                  positions=range(4), showmeans=0, showextrema=0,
+                  showmedians=0)
 
 
 @image_comparison(baseline_images=['violinplot_vert_showall'],
@@ -2395,6 +2407,31 @@ def test_vert_violinplot_custompoints_200():
                   showmedians=0, points=200)
 
 
+@image_comparison(baseline_images=['violinplot_vert_showstdev',
+                                   'violinplot_vert_show80_20percentiles'],
+                  extensions=['png'])
+def test_vert_violinplot_showcustomstat():
+    """Vertical violins drawing only user-supplied summary statistics."""
+    # Figure 1: mean +/- one standard deviation, given as plain callables.
+    ax = plt.axes()
+    # First 9 digits of frac(sqrt(31))
+    np.random.seed(567764362)
+    data = [np.random.normal(size=100) for i in range(4)]
+    func_list = [lambda x: np.mean(x) + np.std(x),
+                 lambda x: np.mean(x) - np.std(x)]
+    ax.violinplot(data, statistics_function_list=func_list,
+                  positions=range(4), showmeans=0,
+                  showextrema=0, showmedians=0)
+
+    # Figure 2: 80th and 20th percentiles, given as ViolinStatFunc objects
+    # so that the extra percentile argument can be passed along.
+    # plt.subplots() already provides the axes; calling plt.axes() again
+    # is redundant and may add a second axes on top of the first.
+    fig, ax = plt.subplots()
+    from matplotlib.axes._axes import ViolinStatFunc
+    # The aliases name the percentile that is actually computed.
+    percentile80 = ViolinStatFunc(np.percentile,
+                                  alias='80 percentile', args=[80])
+    percentile20 = ViolinStatFunc(np.percentile,
+                                  alias='20 percentile', args=[20])
+    ax.violinplot(data, statistics_function_list=[percentile80, percentile20],
+                  positions=range(4), showmeans=0,
+                  showextrema=0, showmedians=0)
+
+
 @image_comparison(baseline_images=['violinplot_horiz_baseline'],
                   extensions=['png'])
 def test_horiz_violinplot_baseline():
@@ -2406,7 +2443,8 @@ def test_horiz_violinplot_baseline():
                   showextrema=0, showmedians=0)
 
 
-@image_comparison(baseline_images=['violinplot_horiz_showmedians'],
+@image_comparison(baseline_images=['violinplot_horiz_showmedians',
+                                   'violinplot_horiz_showmedians'],
                   extensions=['png'])
 def test_horiz_violinplot_showmedians():
     ax = plt.axes()
@@ -2415,9 +2453,15 @@ def test_horiz_violinplot_showmedians():
     data = [np.random.normal(size=100) for i in range(4)]
     ax.violinplot(data, positions=range(4), vert=False, showmeans=0,
                   showextrema=0, showmedians=1)
+    fig, ax = plt.subplots()
+    ax = plt.axes()
+    ax.violinplot(data, statistics_function_list=[np.median],
+                  positions=range(4), vert=False,
+                  showmeans=0, showextrema=0, showmedians=0)
 
 
-@image_comparison(baseline_images=['violinplot_horiz_showmeans'],
+@image_comparison(baseline_images=['violinplot_horiz_showmeans',
+                                   'violinplot_horiz_showmeans'],
                   extensions=['png'])
 def test_horiz_violinplot_showmeans():
     ax = plt.axes()
@@ -2426,6 +2470,11 @@ def test_horiz_violinplot_showmeans():
     data = [np.random.normal(size=100) for i in range(4)]
     ax.violinplot(data, positions=range(4), vert=False, showmeans=1,
                   showextrema=0, showmedians=0)
+    fig, ax = plt.subplots()
+    ax = plt.axes()
+    ax.violinplot(data, statistics_function_list=[np.mean],
+                  positions=range(4), vert=False,
+                  showmeans=0, showmedians=0, showextrema=0)
 
 
 @image_comparison(baseline_images=['violinplot_horiz_showextrema'],
@@ -2472,6 +2521,31 @@ def test_horiz_violinplot_custompoints_200():
                   showextrema=0, showmedians=0, points=200)
 
 
+@image_comparison(baseline_images=['violinplot_horiz_showstdev',
+                                   'violinplot_horiz_show95_5percentiles'],
+                  extensions=['png'])
+def test_horiz_violinplot_showcustomstat():
+    """Horizontal violins drawing only user-supplied summary statistics."""
+    # Figure 1: mean +/- one standard deviation, given as plain callables.
+    ax = plt.axes()
+    # First 9 digits of frac(sqrt(31))
+    np.random.seed(567764362)
+    data = [np.random.normal(size=100) for i in range(4)]
+    func_list = [lambda x: np.mean(x) + np.std(x),
+                 lambda x: np.mean(x) - np.std(x)]
+    ax.violinplot(data, statistics_function_list=func_list,
+                  positions=range(4), vert=False, showmeans=0,
+                  showextrema=0, showmedians=0)
+
+    # Figure 2: 95th and 5th percentiles, given as ViolinStatFunc objects
+    # so that the extra percentile argument can be passed along.
+    # plt.subplots() already provides the axes; calling plt.axes() again
+    # is redundant and may add a second axes on top of the first.
+    fig, ax = plt.subplots()
+    from matplotlib.axes._axes import ViolinStatFunc
+    percentile95 = ViolinStatFunc(np.percentile,
+                                  alias='95 percentile', args=[95])
+    percentile5 = ViolinStatFunc(np.percentile,
+                                 alias='5 percentile', args=[5])
+    ax.violinplot(data, statistics_function_list=[percentile95, percentile5],
+                  positions=range(4), vert=False, showmeans=0,
+                  showextrema=0, showmedians=0)
+
+
 def test_violinplot_bad_positions():
     ax = plt.axes()
     # First 9 digits of frac(sqrt(47))