clean up and parametrize mode tests and add versionadded

reidy-p · reidy-p · commit b523d23f2259 · 2018-05-02T20:55:37.000+01:00
diff --git a/pandas/core/algorithms.py b/pandas/core/algorithms.py
@@ -809,6 +809,8 @@ def mode(values, dropna=True):
     dropna : boolean, default True
         Don't consider counts of NaN/NaT.
 
+        .. versionadded:: 0.23.0
+
     Returns
     -------
     mode : Series
diff --git a/pandas/core/arrays/categorical.py b/pandas/core/arrays/categorical.py
@@ -2128,6 +2128,8 @@ def mode(self, dropna=True):
         dropna : boolean, default True
             Don't consider counts of NaN/NaT.
 
+            .. versionadded:: 0.23.0
+
         Returns
         -------
         modes : `Categorical` (sorted)
diff --git a/pandas/core/frame.py b/pandas/core/frame.py
@@ -326,7 +326,6 @@ def _constructor(self):
     _constructor_sliced = Series
     _deprecations = NDFrame._deprecations | frozenset(
         ['sortlevel', 'get_value', 'set_value', 'from_csv', 'from_items'])
-    _accessors = set()
 
     @property
     def _constructor_expanddim(self):
@@ -7059,6 +7058,8 @@ def mode(self, axis=0, numeric_only=False, dropna=True):
         dropna : boolean, default True
             Don't consider counts of NaN/NaT.
 
+            .. versionadded:: 0.23.0
+
         Returns
         -------
         modes : DataFrame (sorted)
@@ -7126,10 +7127,6 @@ def quantile(self, q=0.5, axis=0, numeric_only=True,
                a     b
         0.1  1.3   3.7
         0.5  2.5  55.0
-
-        See Also
-        --------
-        pandas.core.window.Rolling.quantile
         """
         self._check_percentile(q)
 
diff --git a/pandas/core/series.py b/pandas/core/series.py
@@ -1441,6 +1441,8 @@ def mode(self, dropna=True):
         dropna : boolean, default True
             Don't consider counts of NaN/NaT.
 
+            .. versionadded:: 0.23.0
+
         Returns
         -------
         modes : Series (sorted)
diff --git a/pandas/tests/frame/test_analytics.py b/pandas/tests/frame/test_analytics.py
@@ -20,7 +20,6 @@
 import pandas as pd
 import pandas.core.nanops as nanops
 import pandas.core.algorithms as algorithms
-import pandas.io.formats.printing as printing
 
 import pandas.util.testing as tm
 import pandas.util._test_decorators as td
@@ -841,87 +840,62 @@ def wrapper(x):
                 expected = pd.Series(unit, index=r1.index, dtype=r1.dtype)
                 tm.assert_series_equal(r1, expected)
 
-    def test_mode(self):
-        df = pd.DataFrame({"A": [12, 12, 11, 12, 19, 11],
-                           "B": [10, 10, 10, np.nan, 3, 4],
-                           "C": [8, 8, 8, 9, 9, 9],
-                           "D": np.arange(6, dtype='int64'),
-                           "E": [8, 8, 1, 1, 3, 3]})
-        tm.assert_frame_equal(df[["A"]].mode(),
-                              pd.DataFrame({"A": [12]}))
-        expected = pd.Series([0, 1, 2, 3, 4, 5], dtype='int64', name='D').\
-            to_frame()
-        tm.assert_frame_equal(df[["D"]].mode(), expected)
-        expected = pd.Series([1, 3, 8], dtype='int64', name='E').to_frame()
-        tm.assert_frame_equal(df[["E"]].mode(), expected)
-        tm.assert_frame_equal(df[["A", "B"]].mode(),
-                              pd.DataFrame({"A": [12], "B": [10.]}))
-        tm.assert_frame_equal(df.mode(),
-                              pd.DataFrame({"A": [12, np.nan, np.nan, np.nan,
-                                                  np.nan, np.nan],
-                                            "B": [10, np.nan, np.nan, np.nan,
-                                                  np.nan, np.nan],
-                                            "C": [8, 9, np.nan, np.nan, np.nan,
-                                                  np.nan],
-                                            "D": [0, 1, 2, 3, 4, 5],
-                                            "E": [1, 3, 8, np.nan, np.nan,
-                                                  np.nan]}))
-
-        # outputs in sorted order
-        df["C"] = list(reversed(df["C"]))
-        printing.pprint_thing(df["C"])
-        printing.pprint_thing(df["C"].mode())
-        a, b = (df[["A", "B", "C"]].mode(),
-                pd.DataFrame({"A": [12, np.nan],
-                              "B": [10, np.nan],
-                              "C": [8, 9]}))
-        printing.pprint_thing(a)
-        printing.pprint_thing(b)
-        tm.assert_frame_equal(a, b)
-        # should work with heterogeneous types
-        df = pd.DataFrame({"A": np.arange(6, dtype='int64'),
-                           "B": pd.date_range('2011', periods=6),
-                           "C": list('abcdef')})
-        exp = pd.DataFrame({"A": pd.Series(np.arange(6, dtype='int64'),
-                                           dtype=df["A"].dtype),
-                            "B": pd.Series(pd.date_range('2011', periods=6),
-                                           dtype=df["B"].dtype),
-                            "C": pd.Series(list('abcdef'),
-                                           dtype=df["C"].dtype)})
-        tm.assert_frame_equal(df.mode(), exp)
-
-    def test_mode_dropna(self):
-        # GH 17534
-        # Test the dropna=False parameter for mode
-
-        df = pd.DataFrame({"A": [1, np.nan, np.nan, np.nan],
-                           "B": [np.nan, np.nan, 'a', np.nan],
-                           "C": Categorical([np.nan, np.nan, 'a', np.nan]),
-                           "D": to_datetime(['NaT', '2000-1-2', 'NaT', 'NaT']),
-                           "E": to_timedelta(['1 days', 'nan', 'nan', 'nan']),
-                           "F": [1, 1, np.nan, np.nan],
-                           "G": [np.nan, np.nan, 'a', 'a'],
-                           "H": Categorical(['a', np.nan, 'a', np.nan]),
-                           "I": to_datetime(['2000-1-2', '2000-1-2',
+    @pytest.mark.parametrize("dropna, expected", [
+        (True, {'A': [12],
+                'B': [10.0],
+                'C': [1.0],
+                'D': ['a'],
+                'E': Categorical(['a'], categories=['a']),
+                'F': to_datetime(['2000-1-2']),
+                'G': to_timedelta(['1 days'])}),
+        (False, {'A': [12],
+                 'B': [10.0],
+                 'C': [np.nan],
+                 'D': np.array([np.nan], dtype=object),
+                 'E': Categorical([np.nan], categories=['a']),
+                 'F': [pd.NaT],
+                 'G': to_timedelta([pd.NaT])}),
+        (True, {'H': [8, 9, np.nan, np.nan],
+                'I': [8, 9, np.nan, np.nan],
+                'J': [1, np.nan, np.nan, np.nan],
+                'K': ['a', np.nan, np.nan, np.nan],
+                'L': Categorical(['a', np.nan, np.nan, np.nan],
+                                 categories=['a']),
+                'M': to_datetime(['2000-1-2', 'NaT', 'NaT', 'NaT']),
+                'N': to_timedelta(['1 days', 'nan', 'nan', 'nan']),
+                'O': [0, 1, 2, 3]}),
+        (False, {'H': [8, 9, np.nan, np.nan],
+                 'I': [8, 9, np.nan, np.nan],
+                 'J': [1, np.nan, np.nan, np.nan],
+                 'K': [np.nan, 'a', np.nan, np.nan],
+                 'L': Categorical([np.nan, 'a', np.nan, np.nan],
+                                  categories=['a']),
+                 'M': to_datetime(['NaT', '2000-1-2', 'NaT', 'NaT']),
+                 'N': to_timedelta(['nan', '1 days', 'nan', 'nan']),
+                 'O': [0, 1, 2, 3]})
+    ])
+    def test_mode_dropna(self, dropna, expected):
+
+        df = pd.DataFrame({"A": [12, 12, 19, 11],
+                           "B": [10, 10, np.nan, 3],
+                           "C": [1, np.nan, np.nan, np.nan],
+                           "D": [np.nan, np.nan, 'a', np.nan],
+                           "E": Categorical([np.nan, np.nan, 'a', np.nan]),
+                           "F": to_datetime(['NaT', '2000-1-2', 'NaT', 'NaT']),
+                           "G": to_timedelta(['1 days', 'nan', 'nan', 'nan']),
+                           "H": [8, 8, 9, 9],
+                           "I": [9, 9, 8, 8],
+                           "J": [1, 1, np.nan, np.nan],
+                           "K": [np.nan, np.nan, 'a', 'a'],
+                           "L": Categorical(['a', np.nan, 'a', np.nan]),
+                           "M": to_datetime(['2000-1-2', '2000-1-2',
                                              'NaT', 'NaT']),
-                           "J": to_timedelta(['1 days', 'nan',
-                                              '1 days', 'nan'])})
-
-        result = df.loc[:, 'A':'E'].mode(dropna=False)
-        expected = pd.DataFrame({'A': [np.nan],
-                                 'B': np.array([np.nan], dtype=object),
-                                 'C': Categorical([np.nan], categories=['a']),
-                                 'D': [pd.NaT],
-                                 'E': to_timedelta([pd.NaT])})
-        tm.assert_frame_equal(result, expected)
-
-        result = df.loc[:, 'F':'J'].mode(dropna=False)
-        expected = pd.DataFrame({'F': [1, np.nan],
-                                 'G': [np.nan, 'a'],
-                                 'H': Categorical([np.nan, 'a'],
-                                                  categories=['a']),
-                                 'I': to_datetime(['NaT', '2000-1-2']),
-                                 'J': to_timedelta(['nan', '1 days'])})
+                           "N": to_timedelta(['1 days', 'nan',
+                                              '1 days', 'nan']),
+                           "O": np.arange(4, dtype='int64')})
+
+        result = df[sorted(list(expected.keys()))].mode(dropna=dropna)
+        expected = pd.DataFrame(expected)
         tm.assert_frame_equal(result, expected)
 
     def test_operators_timedelta64(self):
diff --git a/pandas/tests/series/test_analytics.py b/pandas/tests/series/test_analytics.py