pandas-dev · WillAyd · Jun 22, 2020 · Apr 12, 2020 · May 17, 2020 · May 18, 2020
diff --git a/pandas/plotting/_core.py b/pandas/plotting/_core.py
@@ -21,6 +21,7 @@ def hist_series(
     yrot=None,
     figsize=None,
     bins=10,
+    legend=False,
     backend=None,
     **kwargs,
 ):
@@ -50,6 +51,8 @@ def hist_series(
         bin edges are calculated and returned. If bins is a sequence, gives
         bin edges, including left edge of first bin and right edge of last
         bin. In this case, bins is returned unmodified.
+    legend : bool, default False
+        Whether to show the legend.
     backend : str, default None
         Backend to use instead of the backend specified in the option
         ``plotting.backend``. For instance, 'matplotlib'. Alternatively, to
@@ -82,6 +85,7 @@ def hist_series(
         yrot=yrot,
         figsize=figsize,
         bins=bins,
+        legend=legend,
         **kwargs,
     )
 
@@ -101,6 +105,7 @@ def hist_frame(
     figsize=None,
     layout=None,
     bins=10,
+    legend=False,
     backend=None,
     **kwargs,
 ):
@@ -154,6 +159,8 @@ def hist_frame(
         bin edges are calculated and returned. If bins is a sequence, gives
         bin edges, including left edge of first bin and right edge of last
         bin. In this case, bins is returned unmodified.
+    legend : bool, default False
+        Whether to show the legend.
     backend : str, default None
         Backend to use instead of the backend specified in the option
         ``plotting.backend``. For instance, 'matplotlib'. Alternatively, to
@@ -203,6 +210,7 @@ def hist_frame(
         sharey=sharey,
         figsize=figsize,
         layout=layout,
+        legend=legend,
         bins=bins,
         **kwargs,
     )

diff --git a/pandas/plotting/_matplotlib/hist.py b/pandas/plotting/_matplotlib/hist.py
@@ -225,6 +225,7 @@ def _grouped_hist(
     xrot=None,
     ylabelsize=None,
     yrot=None,
+    legend=False,
     **kwargs,
 ):
     """
@@ -243,15 +244,27 @@ def _grouped_hist(
     sharey : bool, default False
     rot : int, default 90
     grid : bool, default True
+    legend : bool, default False
     kwargs : dict, keyword arguments passed to matplotlib.Axes.hist
 
     Returns
     -------
     collection of Matplotlib Axes
     """
 
+    if legend and "label" not in kwargs:
+        if isinstance(data, ABCDataFrame):
+            if column is None:
+                kwargs["label"] = data.columns
+            else:
+                kwargs["label"] = column
+        else:
+            kwargs["label"] = data.name
+
     def plot_group(group, ax):
         ax.hist(group.dropna().values, bins=bins, **kwargs)
+        if legend:
+            ax.legend()
 
     if xrot is None:
         xrot = rot
@@ -290,6 +303,7 @@ def hist_series(
     yrot=None,
     figsize=None,
     bins=10,
+    legend=False,
     **kwds,
 ):
     import matplotlib.pyplot as plt
@@ -308,8 +322,11 @@ def hist_series(
         elif ax.get_figure() != fig:
             raise AssertionError("passed axis not bound to passed figure")
         values = self.dropna().values
-
+        if legend and "label" not in kwds:
+            kwds["label"] = self.name
         ax.hist(values, bins=bins, **kwds)
+        if legend:
+            ax.legend()
         ax.grid(grid)
         axes = np.array([ax])
 
@@ -334,6 +351,7 @@ def hist_series(
             xrot=xrot,
             ylabelsize=ylabelsize,
             yrot=yrot,
+            legend=legend,
             **kwds,
         )
 
@@ -358,6 +376,7 @@ def hist_frame(
     figsize=None,
     layout=None,
     bins=10,
+    legend=False,
     **kwds,
 ):
     if by is not None:
@@ -376,6 +395,7 @@ def hist_frame(
             xrot=xrot,
             ylabelsize=ylabelsize,
             yrot=yrot,
+            legend=legend,
             **kwds,
         )
         return axes
@@ -401,11 +421,17 @@ def hist_frame(
     )
     _axes = _flatten(axes)
 
+    can_set_label = "label" not in kwds
+
     for i, col in enumerate(data.columns):
         ax = _axes[i]
+        if legend and can_set_label:
+            kwds["label"] = col
         ax.hist(data[col].dropna().values, bins=bins, **kwds)
         ax.set_title(col)
         ax.grid(grid)
+        if legend:
+            ax.legend()
 
     _set_ticks_props(
         axes, xlabelsize=xlabelsize, xrot=xrot, ylabelsize=ylabelsize, yrot=yrot

diff --git a/pandas/tests/plotting/test_groupby.py b/pandas/tests/plotting/test_groupby.py
@@ -2,10 +2,11 @@
 
 
 import numpy as np
+import pytest
 
 import pandas.util._test_decorators as td
 
-from pandas import DataFrame, Series
+from pandas import DataFrame, Index, Series
 import pandas._testing as tm
 from pandas.tests.plotting.common import TestPlotBase
 
@@ -65,3 +66,18 @@ def test_plot_kwargs(self):
 
         res = df.groupby("z").plot.scatter(x="x", y="y")
         assert len(res["a"].collections) == 1
+
+
+@td.skip_if_no_mpl
+@pytest.mark.parametrize("column", [None, "b"])
+@pytest.mark.parametrize("label", [None, "d"])
+def test_hist_with_legend(column, label):
+    index = Index(15 * [1] + 15 * [2], name="c")
+    df = DataFrame(np.random.randn(30, 2), index=index, columns=["a", "b"])
+    g = df.groupby("c")
+
+    g.hist(column=column, label=label, legend=True)
+    tm.close()
+    if column != "b":
+        g["a"].hist(label=label, legend=True)
+        tm.close()
diff --git a/pandas/tests/plotting/test_hist_method.py b/pandas/tests/plotting/test_hist_method.py
@@ -6,7 +6,7 @@
 
 import pandas.util._test_decorators as td
 
-from pandas import DataFrame, Series
+from pandas import DataFrame, Index, Series
 import pandas._testing as tm
 from pandas.tests.plotting.common import TestPlotBase, _check_plot_works
 
@@ -293,6 +293,28 @@ def test_hist_column_order_unchanged(self, column, expected):
 
         assert result == expected
 
+    @pytest.mark.slow
+    @pytest.mark.parametrize("by", [None, "b"])
+    @pytest.mark.parametrize("label", [None, "c"])
+    def test_hist_with_legend(self, by, label):
+        expected_labels = label or "a"
+        expected_axes_num = 1 if by is None else 2
+        expected_layout = (1, 1) if by is None else (1, 2)
+
+        index = 15 * [1] + 15 * [2]
+        s = Series(np.random.randn(30), index=index, name="a")
+        s.index.name = "b"
+
+        kwargs = {"legend": True, "by": by}
+        if label is not None:
+            # Behavior differs if kwargs contains "label": None
+            kwargs["label"] = label
+
+        _check_plot_works(s.hist, **kwargs)
+        axes = s.hist(**kwargs)
+        self._check_axes_shape(axes, axes_num=expected_axes_num, layout=expected_layout)
+        self._check_legend_labels(axes, expected_labels)
+
 
 @td.skip_if_no_mpl
 class TestDataFrameGroupByPlots(TestPlotBase):
@@ -484,3 +506,30 @@ def test_axis_share_xy(self):
 
         assert ax1._shared_y_axes.joined(ax1, ax2)
         assert ax2._shared_y_axes.joined(ax1, ax2)
+
+    @pytest.mark.slow
+    @pytest.mark.parametrize("by", [None, "c"])
+    @pytest.mark.parametrize("column", [None, "b"])
+    @pytest.mark.parametrize("label", [None, "d"])
+    def test_hist_with_legend(self, by, column, label):
+        expected_axes_num = 1 if by is None and column is not None else 2
+        expected_layout = (1, expected_axes_num)
+        expected_labels = label or column or ["a", "b"]
+        if by is not None:
+            expected_labels = [expected_labels] * 2
+
+        index = Index(15 * [1] + 15 * [2], name="c")
+        df = DataFrame(np.random.randn(30, 2), index=index, columns=["a", "b"])
+
+        kwargs = {"legend": True, "by": by, "column": column}
+        if label is not None:
+            # Behavior differs if kwargs contains "label": None
+            kwargs["label"] = label
+
+        _check_plot_works(df.hist, **kwargs)
+        axes = df.hist(**kwargs)
+        self._check_axes_shape(axes, axes_num=expected_axes_num, layout=expected_layout)
+        if by is None:
+            axes = axes[0]
+        for expected_label, ax in zip(expected_labels, axes):
+            self._check_legend_labels(ax, expected_label)