
BUG: Rolling groupby should not maintain the by column in the resulting DataFrame #32332


Closed

wants to merge 41 commits into from

Changes from 29 commits

41 commits
a6ad6c5
make sure exclusions are applied before the groupby object reaches ro…
Feb 28, 2020
54903a7
pass object with exclusions earlier on
MarcoGorelli Feb 29, 2020
d81c572
revert accident
MarcoGorelli Feb 29, 2020
e049205
check for side effects in obj
MarcoGorelli Feb 29, 2020
5f43f3a
wip
MarcoGorelli Mar 1, 2020
3b1c3ff
Wip
MarcoGorelli Mar 1, 2020
207a507
change _selected_obj according to self.mutated
MarcoGorelli Mar 1, 2020
c9b34b2
sanitize
MarcoGorelli Mar 1, 2020
b2ce758
update old tests
MarcoGorelli Mar 1, 2020
c307fdc
fix old docstring
MarcoGorelli Mar 1, 2020
35f2b2d
finish correcting old docstring
MarcoGorelli Mar 1, 2020
2bb7932
use getattr
MarcoGorelli Mar 1, 2020
eed4122
old fix
Mar 3, 2020
26d9dec
simpler fix
Mar 3, 2020
68b4299
try making Window's own _shallow_copy
Mar 3, 2020
159a3d6
more wip
Mar 3, 2020
0b393b6
typeerror!
Mar 3, 2020
9fc50ee
add some types, comment tests
Mar 3, 2020
7fe2fcf
fix typing
Mar 3, 2020
8a34ff4
better fix
Mar 3, 2020
8953bda
correct return annotation
Mar 3, 2020
b2b8a42
simplify code
Mar 3, 2020
d476191
fix upstream, remove try except
Mar 4, 2020
63e3d85
document change as api-breaking
Mar 4, 2020
17373ad
Merge remote-tracking branch 'upstream/master' into rolling-groupby
MarcoGorelli Mar 15, 2020
a7ca8eb
remove elements from exclusions within _obj_with_exclusions
MarcoGorelli Mar 15, 2020
35e7340
remove no-longer-necessary performance warning
MarcoGorelli Mar 15, 2020
17090da
simplify _obj_with_exclusions
MarcoGorelli Mar 15, 2020
7c7f79c
correct comment
MarcoGorelli Mar 15, 2020
9b98dad
Merge remote-tracking branch 'upstream/master' into rolling-groupby
Mar 19, 2020
4d1c5a6
deal with multiindexed columns case
Mar 21, 2020
0dde4a8
use elif in _obj_with_exclusions, add test for column multiindex, dis…
Mar 21, 2020
1e4ba56
simplify unique_column_names
Mar 21, 2020
6312725
rewrite using get_level_values
Mar 21, 2020
d9748d1
revert 'or' which was accidentally changed to 'and'
Mar 21, 2020
1623902
only patch _apply, cov and corr
Mar 21, 2020
5d7a477
reinstate change to _obj_with_exclusions
Mar 21, 2020
d117624
exclude 'by' column in Rolling.count
Mar 22, 2020
367e671
don't modify _selected_obj - instead, patch obj before we reach apply
Mar 22, 2020
d7cf9f1
slight simplification to _shallow_copy
Mar 22, 2020
d251715
comment on patch in corr and cov
Mar 22, 2020
25 changes: 25 additions & 0 deletions doc/source/whatsnew/v1.1.0.rst
@@ -166,6 +166,31 @@ key and type of :class:`Index`. These now consistently raise ``KeyError`` (:iss
...
KeyError: Timestamp('1970-01-01 00:00:00')

GroupBy.rolling no longer returns grouped-by column in values
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^

Contributor:

Add an explanation here, a couple of sentences, and the issue number.

*Previous behavior*:

.. code-block:: ipython

    In [1]: df = pd.DataFrame({"A": [1, 1, 2, 3], "B": [0, 1, 2, 3]})

    In [2]: df.groupby("A").rolling(2).sum()
    Out[2]:
           A    B
    A
    1 0  NaN  NaN
      1  2.0  1.0
    2 2  NaN  NaN
    3 3  NaN  NaN

*New behavior*:

.. ipython:: python

    df = pd.DataFrame({"A": [1, 1, 2, 3], "B": [0, 1, 2, 3]})
    df.groupby("A").rolling(2).sum()

.. ---------------------------------------------------------------------------

.. _whatsnew_110.api_breaking.assignment_to_multiple_columns:
9 changes: 6 additions & 3 deletions pandas/core/base.py
@@ -207,11 +207,14 @@ def _obj_with_exclusions(self):
        if self._selection is not None and isinstance(self.obj, ABCDataFrame):
            return self.obj.reindex(columns=self._selection_list)

        if len(self.exclusions) > 0:
            return self.obj.drop(self.exclusions, axis=1)
        else:
        if not isinstance(self.obj, ABCDataFrame) or not self.exclusions:
            return self.obj

        # there may be elements in self.exclusions that are no longer
        # in self.obj, see GH 32468
        exclusions = self.exclusions.intersection(self.obj.columns)
        return self.obj.drop(exclusions, axis=1)

    def __getitem__(self, key):
        if self._selection is not None:
            raise IndexError(f"Column(s) {self._selection} already selected")
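
A standalone illustration of the guard added above, using plain DataFrame operations rather than the pandas internals: if the exclusions still name a column that is no longer present in the object, a bare drop raises, while intersecting with the current columns first is safe.

    import pandas as pd

    df = pd.DataFrame({"A": [1, 1, 2], "B": [0, 1, 2]})
    exclusions = {"A", "C"}  # "C" is no longer among df's columns (the GH 32468 situation)

    # df.drop(list(exclusions), axis=1) would raise KeyError because of "C".
    # Intersecting with the current columns first makes the drop safe:
    safe_exclusions = list(exclusions.intersection(df.columns))
    print(df.drop(safe_exclusions, axis=1).columns.tolist())  # ['B']
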
1 change: 1 addition & 0 deletions pandas/core/groupby/groupby.py
@@ -1577,6 +1577,7 @@ def rolling(self, *args, **kwargs):
"""
from pandas.core.window import RollingGroupby

kwargs["exclusions"] = self.exclusions
return RollingGroupby(self, *args, **kwargs)

@Substitution(name="groupby")
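
A schematic sketch of the hand-off above, using hypothetical stand-in classes rather than the real pandas constructors: the groupby object forwards its exclusions through the keyword arguments, and the window object (see the matching pickup in rolling.py further below) stores them for later use.

    class ToyGroupBy:
        def __init__(self, obj, by):
            self.obj = obj
            self.exclusions = {by}  # the grouped-by column is recorded as an exclusion

        def rolling(self, *args, **kwargs):
            # mirrors the groupby.py change: thread exclusions into the window object
            kwargs["exclusions"] = self.exclusions
            return ToyRollingGroupby(self, *args, **kwargs)

    class ToyRollingGroupby:
        def __init__(self, groupby, window, **kwargs):
            self._groupby = groupby
            self.window = window
            # mirrors the rolling.py change: pick the exclusions up from kwargs
            self.exclusions = kwargs.get("exclusions", set())

    r = ToyGroupBy(obj=None, by="A").rolling(2)
    print(r.exclusions)  # {'A'}
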
1 change: 1 addition & 0 deletions pandas/core/window/ewm.py
@@ -142,6 +142,7 @@ def __init__(
        adjust=True,
        ignore_na=False,
        axis=0,
        **kwargs,
    ):
        self.obj = obj
        self.com = _get_center_of_mass(com, span, halflife, alpha)
7 changes: 7 additions & 0 deletions pandas/core/window/rolling.py
@@ -93,6 +93,13 @@ def __init__(
        self.axis = obj._get_axis_number(axis) if axis is not None else None
        self.validate()
        self._numba_func_cache: Dict[Optional[str], Callable] = dict()
        self.exclusions = kwargs.get("exclusions", set())

    def _shallow_copy(self, obj: FrameOrSeries, **kwargs) -> ShallowMixin:
        exclusions = self.exclusions
        new_obj = super()._shallow_copy(obj, exclusions=exclusions, **kwargs)
        new_obj.obj = new_obj._obj_with_exclusions
Contributor:

Are you sure this line is actually needed? This is very, very odd to do.

Contributor:

Copying the exclusions should be enough. You may be able to move this shallow copy to pandas/core/groupby/groupby.py, which is better than here.

Member Author:

The reason for doing this was that RollingGroupby._groupby._python_apply_general operates on RollingGroupby._groupby._selected_obj, and RollingGroupby._groupby._selected_obj returns RollingGroupby._groupby.obj, possibly sliced by RollingGroupby._groupby._selection.

Member Author (@MarcoGorelli, Mar 21, 2020):

> you may be able to move this shallow copy to pandas/core/groupby/groupby.py

As in, define _GroupBy._shallow_copy? I don't understand how that would work: when we call Rolling.sum, we go to _Rolling_and_Expanding.sum and then WindowGroupByMixin._apply. Inside there, we have

        def f(x, name=name, *args):
            x = self._shallow_copy(x)

            if isinstance(name, str):
                return getattr(x, name)(*args, **kwargs)

            return x.apply(name, *args, **kwargs)

Here, self is WindowGroupByMixin. In the case when we get here from Rolling.sum, then self._shallow_copy will take us directly to ShallowMixin._shallow_copy. Therefore, even if we define _GroupBy._shallow_copy, the execution won't get there during this operation.
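
A minimal toy example of the method-resolution point above (hypothetical class names, not the pandas hierarchy): a _shallow_copy defined on a class that is not one of the caller's bases is simply never consulted.

    class ToyShallowMixin:
        def _shallow_copy(self, obj):
            return f"ToyShallowMixin copy of {obj!r}"

    class ToyGroupBy:
        # Defining the method here has no effect on ToyWindowGroupBy below,
        # because ToyGroupBy is not part of its MRO.
        def _shallow_copy(self, obj):
            return f"ToyGroupBy copy of {obj!r}"

    class ToyWindowGroupBy(ToyShallowMixin):
        def _apply(self, obj):
            # resolves through ToyWindowGroupBy's MRO -> ToyShallowMixin
            return self._shallow_copy(obj)

    print(ToyWindowGroupBy()._apply("x"))  # ToyShallowMixin copy of 'x'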

EDIT

Anyway, am trying a slightly different approach, will ping if/when green and once I've thought over why corr and cov currently use ._selected_obj instead of ._obj_with_exclusions

Member Author:

@jreback thanks for your review. I've pushed a new attempt at a solution.

I patch obj before we get to _GroupBy.apply, and only for Rolling, so that the previous behaviour of DataFrame.groupby.apply is preserved.

        return new_obj

    @property
    def _constructor(self):
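
A user-facing sketch of the behaviour described in the last comment above, assuming a pandas build that includes this change: only the Rolling path drops the grouped-by column, while DataFrame.groupby(...).apply is left untouched and still keeps it (which is why the updated tests below drop "A" from the apply-based expectations).

    import pandas as pd

    df = pd.DataFrame({"A": [1, 1, 2, 3], "B": [0, 1, 2, 3]})
    g = df.groupby("A")

    # Rolling no longer carries the grouped-by column in the values
    rolled = g.rolling(2).sum()
    print(list(rolled.columns))  # ['B']

    # groupby.apply keeps "A" in the result, as before
    applied = g.apply(lambda x: x.rolling(2).sum())
    print(list(applied.columns))  # ['A', 'B']
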
5 changes: 1 addition & 4 deletions pandas/tests/groupby/test_groupby.py
@@ -5,8 +5,6 @@
import numpy as np
import pytest

from pandas.errors import PerformanceWarning

import pandas as pd
from pandas import DataFrame, Index, MultiIndex, Series, Timestamp, date_range, read_csv
import pandas._testing as tm
@@ -1565,8 +1563,7 @@ def test_groupby_multiindex_not_lexsorted():
    tm.assert_frame_equal(lexsorted_df, not_lexsorted_df)

    expected = lexsorted_df.groupby("a").mean()
    with tm.assert_produces_warning(PerformanceWarning):
        result = not_lexsorted_df.groupby("a").mean()
    result = not_lexsorted_df.groupby("a").mean()
    tm.assert_frame_equal(expected, result)

    # a transforming function should work regardless of sort
10 changes: 10 additions & 0 deletions pandas/tests/window/test_grouper.py
@@ -62,11 +62,15 @@ def test_rolling(self):
        for f in ["sum", "mean", "min", "max", "count", "kurt", "skew"]:
            result = getattr(r, f)()
            expected = g.apply(lambda x: getattr(x.rolling(4), f)())
            # groupby.apply doesn't drop the grouped-by column
            expected = expected.drop("A", axis=1)
            tm.assert_frame_equal(result, expected)

        for f in ["std", "var"]:
            result = getattr(r, f)(ddof=1)
            expected = g.apply(lambda x: getattr(x.rolling(4), f)(ddof=1))
            # groupby.apply doesn't drop the grouped-by column
            expected = expected.drop("A", axis=1)
            tm.assert_frame_equal(result, expected)

    @pytest.mark.parametrize(
@@ -79,6 +83,8 @@ def test_rolling_quantile(self, interpolation):
        expected = g.apply(
            lambda x: x.rolling(4).quantile(0.4, interpolation=interpolation)
        )
        # groupby.apply doesn't drop the grouped-by column
        expected = expected.drop("A", axis=1)
        tm.assert_frame_equal(result, expected)

    def test_rolling_corr_cov(self):
@@ -92,6 +98,8 @@ def func(x):
                return getattr(x.rolling(4), f)(self.frame)

            expected = g.apply(func)
            # groupby.apply doesn't drop the grouped-by column
            expected = expected.drop("A", axis=1)
            tm.assert_frame_equal(result, expected)

            result = getattr(r.B, f)(pairwise=True)
@@ -109,6 +117,8 @@ def test_rolling_apply(self, raw):
        # reduction
        result = r.apply(lambda x: x.sum(), raw=raw)
        expected = g.apply(lambda x: x.rolling(4).apply(lambda y: y.sum(), raw=raw))
        # groupby.apply doesn't drop the grouped-by column
        expected = expected.drop("A", axis=1)
        tm.assert_frame_equal(result, expected)

    def test_rolling_apply_mutability(self):
12 changes: 12 additions & 0 deletions pandas/tests/window/test_rolling.py
@@ -465,3 +465,15 @@ def test_rolling_count_default_min_periods_with_null_values(constructor):
    result = constructor(values).rolling(3).count()
    expected = constructor(expected_counts)
    tm.assert_equal(result, expected)


def test_by_column_not_in_values():
    # GH 32262
    df = pd.DataFrame({"A": [1] * 20 + [2] * 12 + [3] * 8, "B": np.arange(40)})

    g = df.groupby("A")
    original_obj = g.obj.copy(deep=True)
    r = g.rolling(4)
    result = r.sum()
    assert "A" not in result.columns
    tm.assert_frame_equal(g.obj, original_obj)  # check for side-effects