From d370b4a72eafc2fe614a9509f37c8d74ed2d0a42 Mon Sep 17 00:00:00 2001
From: Marco Gorelli <marcogorelli@protonmail.com>
Date: Mon, 8 Feb 2021 21:10:23 +0000
Subject: [PATCH 1/7] use ast.parse to fix up inconsistencies in namespace

---
 .pre-commit-config.yaml                       |   3 +-
 pandas/tests/frame/indexing/test_indexing.py  |   8 +-
 pandas/tests/frame/methods/test_describe.py   |   2 +-
 pandas/tests/frame/methods/test_diff.py       |   4 +-
 pandas/tests/frame/methods/test_drop.py       |   4 +-
 pandas/tests/frame/methods/test_join.py       |   2 +-
 .../tests/frame/methods/test_reset_index.py   |   6 +-
 pandas/tests/frame/methods/test_to_csv.py     |  33 +++---
 pandas/tests/frame/test_api.py                |   4 +-
 pandas/tests/frame/test_constructors.py       |   5 +-
 pandas/tests/frame/test_query_eval.py         |   2 +-
 pandas/tests/frame/test_reductions.py         |  22 ++--
 pandas/tests/frame/test_stack_unstack.py      |  10 +-
 pandas/tests/frame/test_subclass.py           |   6 +-
 ...check_for_inconsistent_pandas_namespace.py | 112 ++++++++++++------
 .../test_inconsistent_namespace_check.py      |  40 ++++---
 16 files changed, 155 insertions(+), 108 deletions(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index e0df3434b2906..1c5400d0b294a 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -138,7 +138,8 @@ repos:
         entry: python scripts/check_for_inconsistent_pandas_namespace.py
         language: python
         types: [python]
-        files: ^pandas/tests/
+        files: ^pandas/tests/frame/
+        additional_dependencies: [tokenize-rt]
     -   id: FrameOrSeriesUnion
         name: Check for use of Union[Series, DataFrame] instead of FrameOrSeriesUnion alias
         entry: Union\[.*(Series,.*DataFrame|DataFrame,.*Series).*\]
diff --git a/pandas/tests/frame/indexing/test_indexing.py b/pandas/tests/frame/indexing/test_indexing.py
index 6808ffe65e561..acbff73b69c4d 100644
--- a/pandas/tests/frame/indexing/test_indexing.py
+++ b/pandas/tests/frame/indexing/test_indexing.py
@@ -212,7 +212,7 @@ def test_setitem_multi_index(self):
         it = ["jim", "joe", "jolie"], ["first", "last"], ["left", "center", "right"]
 
         cols = MultiIndex.from_product(it)
-        index = pd.date_range("20141006", periods=20)
+        index = date_range("20141006", periods=20)
         vals = np.random.randint(1, 1000, (len(index), len(cols)))
         df = DataFrame(vals, columns=cols, index=index)
 
@@ -1349,7 +1349,7 @@ def test_loc_duplicates(self):
         # gh-17105
 
         # insert a duplicate element to the index
-        trange = pd.date_range(
+        trange = date_range(
             start=Timestamp(year=2017, month=1, day=1),
             end=Timestamp(year=2017, month=1, day=5),
         )
@@ -1413,7 +1413,7 @@ def test_setitem_with_unaligned_tz_aware_datetime_column(self):
         # GH 12981
         # Assignment of unaligned offset-aware datetime series.
         # Make sure timezone isn't lost
-        column = Series(pd.date_range("2015-01-01", periods=3, tz="utc"), name="dates")
+        column = Series(date_range("2015-01-01", periods=3, tz="utc"), name="dates")
         df = DataFrame({"dates": column})
         df["dates"] = column[[1, 0, 2]]
         tm.assert_series_equal(df["dates"], column)
@@ -1737,7 +1737,7 @@ def test_object_casting_indexing_wraps_datetimelike():
     df = DataFrame(
         {
             "A": [1, 2],
-            "B": pd.date_range("2000", periods=2),
+            "B": date_range("2000", periods=2),
             "C": pd.timedelta_range("1 Day", periods=2),
         }
     )
diff --git a/pandas/tests/frame/methods/test_describe.py b/pandas/tests/frame/methods/test_describe.py
index 15bafb7a835ba..5aade25b1871b 100644
--- a/pandas/tests/frame/methods/test_describe.py
+++ b/pandas/tests/frame/methods/test_describe.py
@@ -277,7 +277,7 @@ def test_describe_tz_values(self, tz_naive_fixture):
         tm.assert_frame_equal(result, expected)
 
     def test_datetime_is_numeric_includes_datetime(self):
-        df = DataFrame({"a": pd.date_range("2012", periods=3), "b": [1, 2, 3]})
+        df = DataFrame({"a": date_range("2012", periods=3), "b": [1, 2, 3]})
         result = df.describe(datetime_is_numeric=True)
         expected = DataFrame(
             {
diff --git a/pandas/tests/frame/methods/test_diff.py b/pandas/tests/frame/methods/test_diff.py
index b8328b43a6b13..a5835ff9bfda2 100644
--- a/pandas/tests/frame/methods/test_diff.py
+++ b/pandas/tests/frame/methods/test_diff.py
@@ -75,7 +75,7 @@ def test_diff_datetime_axis0_with_nat(self, tz):
     @pytest.mark.parametrize("tz", [None, "UTC"])
     def test_diff_datetime_with_nat_zero_periods(self, tz):
         # diff on NaT values should give NaT, not timedelta64(0)
-        dti = pd.date_range("2016-01-01", periods=4, tz=tz)
+        dti = date_range("2016-01-01", periods=4, tz=tz)
         ser = Series(dti)
         df = ser.to_frame()
 
@@ -173,7 +173,7 @@ def test_diff_axis(self):
 
     def test_diff_period(self):
         # GH#32995 Don't pass an incorrect axis
-        pi = pd.date_range("2016-01-01", periods=3).to_period("D")
+        pi = date_range("2016-01-01", periods=3).to_period("D")
         df = DataFrame({"A": pi})
 
         result = df.diff(1, axis=1)
diff --git a/pandas/tests/frame/methods/test_drop.py b/pandas/tests/frame/methods/test_drop.py
index 4568cda24d5cf..a7fdb3ead5ef1 100644
--- a/pandas/tests/frame/methods/test_drop.py
+++ b/pandas/tests/frame/methods/test_drop.py
@@ -21,7 +21,7 @@
 def test_drop_raise_exception_if_labels_not_in_level(msg, labels, level):
     # GH 8594
     mi = MultiIndex.from_arrays([[1, 2, 3], [4, 5, 6]], names=["a", "b"])
-    s = pd.Series([10, 20, 30], index=mi)
+    s = Series([10, 20, 30], index=mi)
     df = DataFrame([10, 20, 30], index=mi)
 
     with pytest.raises(KeyError, match=msg):
@@ -34,7 +34,7 @@ def test_drop_raise_exception_if_labels_not_in_level(msg, labels, level):
 def test_drop_errors_ignore(labels, level):
     # GH 8594
     mi = MultiIndex.from_arrays([[1, 2, 3], [4, 5, 6]], names=["a", "b"])
-    s = pd.Series([10, 20, 30], index=mi)
+    s = Series([10, 20, 30], index=mi)
     df = DataFrame([10, 20, 30], index=mi)
 
     expected_s = s.drop(labels, level=level, errors="ignore")
diff --git a/pandas/tests/frame/methods/test_join.py b/pandas/tests/frame/methods/test_join.py
index 42694dc3ff37c..4e3db5256d434 100644
--- a/pandas/tests/frame/methods/test_join.py
+++ b/pandas/tests/frame/methods/test_join.py
@@ -304,7 +304,7 @@ def test_join_multiindex_leftright(self):
         tm.assert_frame_equal(df1.join(df2, how="left"), exp)
         tm.assert_frame_equal(df2.join(df1, how="right"), exp[["value2", "value1"]])
 
-        exp_idx = pd.MultiIndex.from_product(
+        exp_idx = MultiIndex.from_product(
             [["a", "b"], ["x", "y", "z"]], names=["first", "second"]
         )
         exp = DataFrame(
diff --git a/pandas/tests/frame/methods/test_reset_index.py b/pandas/tests/frame/methods/test_reset_index.py
index 8644f56e4f253..28ed94fb7fb03 100644
--- a/pandas/tests/frame/methods/test_reset_index.py
+++ b/pandas/tests/frame/methods/test_reset_index.py
@@ -423,7 +423,7 @@ def test_reset_index_multiindex_columns(self):
     def test_reset_index_datetime(self, tz_naive_fixture):
         # GH#3950
         tz = tz_naive_fixture
-        idx1 = pd.date_range("1/1/2011", periods=5, freq="D", tz=tz, name="idx1")
+        idx1 = date_range("1/1/2011", periods=5, freq="D", tz=tz, name="idx1")
         idx2 = Index(range(5), name="idx2", dtype="int64")
         idx = MultiIndex.from_arrays([idx1, idx2])
         df = DataFrame(
@@ -450,7 +450,7 @@ def test_reset_index_datetime(self, tz_naive_fixture):
 
         tm.assert_frame_equal(df.reset_index(), expected)
 
-        idx3 = pd.date_range(
+        idx3 = date_range(
             "1/1/2012", periods=5, freq="MS", tz="Europe/Paris", name="idx3"
         )
         idx = MultiIndex.from_arrays([idx1, idx2, idx3])
@@ -489,7 +489,7 @@ def test_reset_index_datetime(self, tz_naive_fixture):
 
         # GH#7793
         idx = MultiIndex.from_product(
-            [["a", "b"], pd.date_range("20130101", periods=3, tz=tz)]
+            [["a", "b"], date_range("20130101", periods=3, tz=tz)]
         )
         df = DataFrame(
             np.arange(6, dtype="int64").reshape(6, 1), columns=["a"], index=idx
diff --git a/pandas/tests/frame/methods/test_to_csv.py b/pandas/tests/frame/methods/test_to_csv.py
index 4cf0b1febf0af..aed784a6e4c3c 100644
--- a/pandas/tests/frame/methods/test_to_csv.py
+++ b/pandas/tests/frame/methods/test_to_csv.py
@@ -12,6 +12,7 @@
     DataFrame,
     Index,
     MultiIndex,
+    NaT,
     Series,
     Timestamp,
     date_range,
@@ -41,7 +42,7 @@ def read_csv(self, path, **kwargs):
         params = {"index_col": 0, "parse_dates": True}
         params.update(**kwargs)
 
-        return pd.read_csv(path, **params)
+        return read_csv(path, **params)
 
     def test_to_csv_from_csv1(self, float_frame, datetime_frame):
 
@@ -123,7 +124,7 @@ def test_to_csv_from_csv3(self):
             df1.to_csv(path)
             df2.to_csv(path, mode="a", header=False)
             xp = pd.concat([df1, df2])
-            rs = pd.read_csv(path, index_col=0)
+            rs = read_csv(path, index_col=0)
             rs.columns = [int(label) for label in rs.columns]
             xp.columns = [int(label) for label in xp.columns]
             tm.assert_frame_equal(xp, rs)
@@ -139,7 +140,7 @@ def test_to_csv_from_csv4(self):
             )
             df.to_csv(path)
 
-            result = pd.read_csv(path, index_col="dt_index")
+            result = read_csv(path, index_col="dt_index")
             result.index = pd.to_timedelta(result.index)
             # TODO: remove renaming when GH 10875 is solved
             result.index = result.index.rename("dt_index")
@@ -153,7 +154,7 @@ def test_to_csv_from_csv5(self, timezone_frame):
         with tm.ensure_clean("__tmp_to_csv_from_csv5__") as path:
 
             timezone_frame.to_csv(path)
-            result = pd.read_csv(path, index_col=0, parse_dates=["A"])
+            result = read_csv(path, index_col=0, parse_dates=["A"])
 
             converter = (
                 lambda c: to_datetime(result[c])
@@ -166,8 +167,6 @@ def test_to_csv_from_csv5(self, timezone_frame):
 
     def test_to_csv_cols_reordering(self):
         # GH3454
-        import pandas as pd
-
         chunksize = 5
         N = int(chunksize * 2.5)
 
@@ -177,17 +176,15 @@ def test_to_csv_cols_reordering(self):
 
         with tm.ensure_clean() as path:
             df.to_csv(path, columns=cols, chunksize=chunksize)
-            rs_c = pd.read_csv(path, index_col=0)
+            rs_c = read_csv(path, index_col=0)
 
         tm.assert_frame_equal(df[cols], rs_c, check_names=False)
 
     def test_to_csv_new_dupe_cols(self):
-        import pandas as pd
-
         def _check_df(df, cols=None):
             with tm.ensure_clean() as path:
                 df.to_csv(path, columns=cols, chunksize=chunksize)
-                rs_c = pd.read_csv(path, index_col=0)
+                rs_c = read_csv(path, index_col=0)
 
                 # we wrote them in a different order
                 # so compare them in that order
@@ -227,8 +224,6 @@ def _check_df(df, cols=None):
     @pytest.mark.slow
     def test_to_csv_dtnat(self):
         # GH3437
-        from pandas import NaT
-
         def make_dtnat_arr(n, nnat=None):
             if nnat is None:
                 nnat = int(n * 0.1)  # 10%
@@ -999,7 +994,7 @@ def test_to_csv_path_is_none(self, float_frame):
         # Series.to_csv()
         csv_str = float_frame.to_csv(path_or_buf=None)
         assert isinstance(csv_str, str)
-        recons = pd.read_csv(StringIO(csv_str), index_col=0)
+        recons = read_csv(StringIO(csv_str), index_col=0)
         tm.assert_frame_equal(float_frame, recons)
 
     @pytest.mark.parametrize(
@@ -1040,7 +1035,7 @@ def test_to_csv_compression(self, df, encoding, compression):
                 df.to_csv(handles.handle, encoding=encoding)
                 assert not handles.handle.closed
 
-            result = pd.read_csv(
+            result = read_csv(
                 filename,
                 compression=compression,
                 encoding=encoding,
@@ -1122,7 +1117,7 @@ def test_to_csv_with_dst_transitions(self):
 
         with tm.ensure_clean("csv_date_format_with_dst") as path:
             # make sure we are not failing on transitions
-            times = pd.date_range(
+            times = date_range(
                 "2013-10-26 23:00",
                 "2013-10-27 01:00",
                 tz="Europe/London",
@@ -1144,7 +1139,7 @@ def test_to_csv_with_dst_transitions(self):
                 tm.assert_frame_equal(result, df)
 
         # GH11619
-        idx = pd.date_range("2015-01-01", "2015-12-31", freq="H", tz="Europe/Paris")
+        idx = date_range("2015-01-01", "2015-12-31", freq="H", tz="Europe/Paris")
         idx = idx._with_freq(None)  # freq does not round-trip
         idx._data._freq = None  # otherwise there is trouble on unpickle
         df = DataFrame({"values": 1, "idx": idx}, index=idx)
@@ -1250,7 +1245,7 @@ def test_to_csv_quoting(self):
         # presents with encoding?
         text_rows = ["a,b,c", '1,"test \r\n",3']
         text = tm.convert_rows_list_to_csv_str(text_rows)
-        df = pd.read_csv(StringIO(text))
+        df = read_csv(StringIO(text))
 
         buf = StringIO()
         df.to_csv(buf, encoding="utf-8", index=False)
@@ -1286,7 +1281,7 @@ def test_period_index_date_overflow(self):
         assert result == expected
 
         # Overflow with pd.NaT
-        dates = ["1990-01-01", pd.NaT, "3005-01-01"]
+        dates = ["1990-01-01", NaT, "3005-01-01"]
         index = pd.PeriodIndex(dates, freq="D")
 
         df = DataFrame([4, 5, 6], index=index)
@@ -1298,7 +1293,7 @@ def test_period_index_date_overflow(self):
 
     def test_multi_index_header(self):
         # see gh-5539
-        columns = pd.MultiIndex.from_tuples([("a", 1), ("a", 2), ("b", 1), ("b", 2)])
+        columns = MultiIndex.from_tuples([("a", 1), ("a", 2), ("b", 1), ("b", 2)])
         df = DataFrame([[1, 2, 3, 4], [5, 6, 7, 8]])
         df.columns = columns
 
diff --git a/pandas/tests/frame/test_api.py b/pandas/tests/frame/test_api.py
index 6b8284908213a..6a19d205b4954 100644
--- a/pandas/tests/frame/test_api.py
+++ b/pandas/tests/frame/test_api.py
@@ -65,7 +65,7 @@ def test_tab_completion(self):
         df = DataFrame([list("abcd"), list("efgh")], columns=list("ABCD"))
         for key in list("ABCD"):
             assert key in dir(df)
-        assert isinstance(df.__getitem__("A"), pd.Series)
+        assert isinstance(df.__getitem__("A"), Series)
 
         # DataFrame whose first-level columns are identifiers shall have
         # them in __dir__.
@@ -77,7 +77,7 @@ def test_tab_completion(self):
             assert key in dir(df)
         for key in list("EFGH"):
             assert key not in dir(df)
-        assert isinstance(df.__getitem__("A"), pd.DataFrame)
+        assert isinstance(df.__getitem__("A"), DataFrame)
 
     def test_not_hashable(self):
         empty_frame = DataFrame()
diff --git a/pandas/tests/frame/test_constructors.py b/pandas/tests/frame/test_constructors.py
index 9ec745932514f..253f66d899193 100644
--- a/pandas/tests/frame/test_constructors.py
+++ b/pandas/tests/frame/test_constructors.py
@@ -33,6 +33,7 @@
 )
 import pandas._testing as tm
 from pandas.arrays import IntervalArray, PeriodArray, SparseArray
+from pandas.core.construction import array as pd_array
 
 MIXED_FLOAT_DTYPES = ["float16", "float32", "float64"]
 MIXED_INT_DTYPES = [
@@ -753,7 +754,7 @@ def test_constructor_extension_scalar_data(self, data, dtype):
         assert df["a"].dtype == dtype
         assert df["b"].dtype == dtype
 
-        arr = pd.array([data] * 2, dtype=dtype)
+        arr = pd_array([data] * 2, dtype=dtype)
         expected = DataFrame({"a": arr, "b": arr})
 
         tm.assert_frame_equal(df, expected)
@@ -2179,7 +2180,7 @@ class DatetimeSubclass(datetime):
 
     def test_with_mismatched_index_length_raises(self):
         # GH#33437
-        dti = pd.date_range("2016-01-01", periods=3, tz="US/Pacific")
+        dti = date_range("2016-01-01", periods=3, tz="US/Pacific")
         with pytest.raises(ValueError, match="Shape of passed values"):
             DataFrame(dti, index=range(4))
 
diff --git a/pandas/tests/frame/test_query_eval.py b/pandas/tests/frame/test_query_eval.py
index af134db587306..d9c602e5438d0 100644
--- a/pandas/tests/frame/test_query_eval.py
+++ b/pandas/tests/frame/test_query_eval.py
@@ -713,7 +713,7 @@ def test_inf(self):
     def test_check_tz_aware_index_query(self, tz_aware_fixture):
         # https://github.com/pandas-dev/pandas/issues/29463
         tz = tz_aware_fixture
-        df_index = pd.date_range(
+        df_index = date_range(
             start="2019-01-01", freq="1d", periods=10, tz=tz, name="time"
         )
         expected = DataFrame(index=df_index)
diff --git a/pandas/tests/frame/test_reductions.py b/pandas/tests/frame/test_reductions.py
index 1c397d6a6a1b5..83441c7606069 100644
--- a/pandas/tests/frame/test_reductions.py
+++ b/pandas/tests/frame/test_reductions.py
@@ -825,7 +825,7 @@ def test_sum_nanops_timedelta(self):
         idx = ["a", "b", "c"]
         df = DataFrame({"a": [0, 0], "b": [0, np.nan], "c": [np.nan, np.nan]})
 
-        df2 = df.apply(pd.to_timedelta)
+        df2 = df.apply(to_timedelta)
 
         # 0 by default
         result = df2.sum()
@@ -855,9 +855,9 @@ def test_sum_bool(self, float_frame):
 
     def test_sum_mixed_datetime(self):
         # GH#30886
-        df = DataFrame(
-            {"A": pd.date_range("2000", periods=4), "B": [1, 2, 3, 4]}
-        ).reindex([2, 3, 4])
+        df = DataFrame({"A": date_range("2000", periods=4), "B": [1, 2, 3, 4]}).reindex(
+            [2, 3, 4]
+        )
         result = df.sum()
 
         expected = Series({"B": 7.0})
@@ -887,7 +887,7 @@ def test_mean_datetimelike(self):
         df = DataFrame(
             {
                 "A": np.arange(3),
-                "B": pd.date_range("2016-01-01", periods=3),
+                "B": date_range("2016-01-01", periods=3),
                 "C": pd.timedelta_range("1D", periods=3),
                 "D": pd.period_range("2016", periods=3, freq="A"),
             }
@@ -906,7 +906,7 @@ def test_mean_datetimelike_numeric_only_false(self):
         df = DataFrame(
             {
                 "A": np.arange(3),
-                "B": pd.date_range("2016-01-01", periods=3),
+                "B": date_range("2016-01-01", periods=3),
                 "C": pd.timedelta_range("1D", periods=3),
             }
         )
@@ -977,7 +977,7 @@ def test_idxmax(self, float_frame, int_frame):
 
     def test_idxmax_mixed_dtype(self):
         # don't cast to object, which would raise in nanops
-        dti = pd.date_range("2016-01-01", periods=3)
+        dti = date_range("2016-01-01", periods=3)
 
         df = DataFrame({1: [0, 2, 1], 2: range(3)[::-1], 3: dti})
 
@@ -1267,8 +1267,8 @@ def test_min_max_dt64_api_consistency_with_NaT(self):
         # returned NaT for series. These tests check that the API is consistent in
         # min/max calls on empty Series/DataFrames. See GH:33704 for more
         # information
-        df = DataFrame({"x": pd.to_datetime([])})
-        expected_dt_series = Series(pd.to_datetime([]))
+        df = DataFrame({"x": to_datetime([])})
+        expected_dt_series = Series(to_datetime([]))
         # check axis 0
         assert (df.min(axis=0).x is pd.NaT) == (expected_dt_series.min() is pd.NaT)
         assert (df.max(axis=0).x is pd.NaT) == (expected_dt_series.max() is pd.NaT)
@@ -1296,7 +1296,7 @@ def test_min_max_dt64_api_consistency_empty_df(self):
     @pytest.mark.parametrize("method", ["min", "max"])
     def test_preserve_timezone(self, initial: str, method):
         # GH 28552
-        initial_dt = pd.to_datetime(initial)
+        initial_dt = to_datetime(initial)
         expected = Series([initial_dt])
         df = DataFrame([expected])
         result = getattr(df, method)(axis=1)
@@ -1324,7 +1324,7 @@ def test_frame_any_with_timedelta(self):
         df = DataFrame(
             {
                 "a": Series([0, 0]),
-                "t": Series([pd.to_timedelta(0, "s"), pd.to_timedelta(1, "ms")]),
+                "t": Series([to_timedelta(0, "s"), to_timedelta(1, "ms")]),
             }
         )
 
diff --git a/pandas/tests/frame/test_stack_unstack.py b/pandas/tests/frame/test_stack_unstack.py
index 81e10d276e79c..b226ec72bf8a6 100644
--- a/pandas/tests/frame/test_stack_unstack.py
+++ b/pandas/tests/frame/test_stack_unstack.py
@@ -150,7 +150,7 @@ def test_unstack_fill_frame(self):
     def test_unstack_fill_frame_datetime(self):
 
         # Test unstacking with date times
-        dv = pd.date_range("2012-01-01", periods=4).values
+        dv = date_range("2012-01-01", periods=4).values
         data = Series(dv)
         data.index = MultiIndex.from_tuples(
             [("x", "a"), ("x", "b"), ("y", "b"), ("z", "a")]
@@ -600,7 +600,7 @@ def test_unstack_dtypes(self):
                     "A": ["a"] * 5,
                     "C": c,
                     "D": d,
-                    "B": pd.date_range("2012-01-01", periods=5),
+                    "B": date_range("2012-01-01", periods=5),
                 }
             )
 
@@ -934,7 +934,7 @@ def verify(df):
         df = DataFrame(
             {
                 "1st": [1, 2, 1, 2, 1, 2],
-                "2nd": pd.date_range("2014-02-01", periods=6, freq="D"),
+                "2nd": date_range("2014-02-01", periods=6, freq="D"),
                 "jim": 100 + np.arange(6),
                 "joe": (np.random.randn(6) * 10).round(2),
             }
@@ -1163,9 +1163,7 @@ def test_unstack_timezone_aware_values():
 
 def test_stack_timezone_aware_values():
     # GH 19420
-    ts = pd.date_range(
-        freq="D", start="20180101", end="20180103", tz="America/New_York"
-    )
+    ts = date_range(freq="D", start="20180101", end="20180103", tz="America/New_York")
     df = DataFrame({"A": ts}, index=["a", "b", "c"])
     result = df.stack()
     expected = Series(
diff --git a/pandas/tests/frame/test_subclass.py b/pandas/tests/frame/test_subclass.py
index 2b462d5a10c51..73eb31087bb11 100644
--- a/pandas/tests/frame/test_subclass.py
+++ b/pandas/tests/frame/test_subclass.py
@@ -56,11 +56,11 @@ def custom_frame_function(self):
         assert cdf_rows.custom_frame_function() == "OK"
 
         # Make sure sliced part of multi-index frame is custom class
-        mcol = pd.MultiIndex.from_tuples([("A", "A"), ("A", "B")])
+        mcol = MultiIndex.from_tuples([("A", "A"), ("A", "B")])
         cdf_multi = CustomDataFrame([[0, 1], [2, 3]], columns=mcol)
         assert isinstance(cdf_multi["A"], CustomDataFrame)
 
-        mcol = pd.MultiIndex.from_tuples([("A", ""), ("B", "")])
+        mcol = MultiIndex.from_tuples([("A", ""), ("B", "")])
         cdf_multi2 = CustomDataFrame([[0, 1], [2, 3]], columns=mcol)
         assert isinstance(cdf_multi2["A"], CustomSeries)
 
@@ -700,7 +700,7 @@ def test_idxmax_preserves_subclass(self):
     def test_equals_subclass(self):
         # https://github.com/pandas-dev/pandas/pull/34402
         # allow subclass in both directions
-        df1 = pd.DataFrame({"a": [1, 2, 3]})
+        df1 = DataFrame({"a": [1, 2, 3]})
         df2 = tm.SubclassedDataFrame({"a": [1, 2, 3]})
         assert df1.equals(df2)
         assert df2.equals(df1)
diff --git a/scripts/check_for_inconsistent_pandas_namespace.py b/scripts/check_for_inconsistent_pandas_namespace.py
index b213d931e7f07..e6774492eb267 100644
--- a/scripts/check_for_inconsistent_pandas_namespace.py
+++ b/scripts/check_for_inconsistent_pandas_namespace.py
@@ -7,52 +7,94 @@
 This is meant to be run as a pre-commit hook - to run it manually, you can do:
 
     pre-commit run inconsistent-namespace-usage --all-files
+
+To automatically fixup a given file, you can pass `--replace`, e.g.
+
+    python scripts/check_for_inconsistent_pandas_namespace.py test_me.py --replace
+
+Note that you may need to manually fixup some imports.
 """
 
 import argparse
-from pathlib import Path
-import re
-from typing import Optional, Sequence
-
-PATTERN = r"""
-    (
-        (?<!pd\.)(?<!\w)    # check class_name doesn't start with pd. or character
-        ([A-Z]\w+)\(        # match DataFrame but not pd.DataFrame or tm.makeDataFrame
-        .*                  # match anything
-        pd\.\2\(            # only match e.g. pd.DataFrame
-    )|
-    (
-        pd\.([A-Z]\w+)\(    # only match e.g. pd.DataFrame
-        .*                  # match anything
-        (?<!pd\.)(?<!\w)    # check class_name doesn't start with pd. or character
-        \4\(                # match DataFrame but not pd.DataFrame or tm.makeDataFrame
-    )
-    """
-ERROR_MESSAGE = "Found both `pd.{class_name}` and `{class_name}` in {path}"
+import ast
+from typing import MutableMapping, Optional, Sequence, Set
+
+from tokenize_rt import Offset, reversed_enumerate, src_to_tokens, tokens_to_src
+
+ERROR_MESSAGE = "Found both `pd.{name}` and `{name}` in {path}"
+EXCLUDE = {
+    "np",  # pd.np is deprecated but still tested
+    "eval",
+}
+
+
+class Visitor(ast.NodeVisitor):
+    def __init__(self):
+        self.pandas_namespace: MutableMapping[Offset, str] = {}
+        self.no_namespace: Set[str] = set()
+
+    def visit_Attribute(self, node: ast.Attribute) -> None:
+        if (
+            isinstance(node.value, ast.Name)
+            and node.value.id == "pd"
+            and node.attr not in EXCLUDE
+        ):
+            self.pandas_namespace[(node.lineno, node.col_offset)] = node.attr
+        self.generic_visit(node)
+
+    def visit_Name(self, node: ast.Name):
+        if node.id not in EXCLUDE:
+            self.no_namespace.add(node.id)
+        self.generic_visit(node)
+
+
+def check_for_inconsistent_pandas_namespace(content, path, *, replace):
+    tree = ast.parse(content)
+
+    visitor = Visitor()
+    visitor.visit(tree)
+
+    tokens = src_to_tokens(content)
+
+    if not visitor.no_namespace.intersection(visitor.pandas_namespace.values()):
+        # No inconsistent namespace usage, nothing to replace.
+        return content
+
+    for n, i in reversed_enumerate(tokens):
+        if (
+            i.offset in visitor.pandas_namespace
+            and visitor.pandas_namespace[i.offset] in visitor.no_namespace
+        ):
+            if not replace:
+                raise RuntimeError(
+                    ERROR_MESSAGE.format(
+                        name=visitor.pandas_namespace[i.offset], path=path
+                    )
+                )
+            # Replace `pd`
+            tokens[n] = i._replace(src="")
+            # Replace `.`
+            tokens[n + 1] = i._replace(src="")
+
+    return tokens_to_src(tokens)
 
 
 def main(argv: Optional[Sequence[str]] = None) -> None:
     parser = argparse.ArgumentParser()
-    parser.add_argument("paths", nargs="*", type=Path)
+    parser.add_argument("paths", nargs="*")
+    parser.add_argument("--replace", action="store_true")
     args = parser.parse_args(argv)
 
-    pattern = re.compile(
-        PATTERN.encode(),
-        flags=re.MULTILINE | re.DOTALL | re.VERBOSE,
-    )
     for path in args.paths:
-        contents = path.read_bytes()
-        match = pattern.search(contents)
-        if match is None:
+        with open(path, encoding="utf-8") as fd:
+            content = fd.read()
+        new_content = check_for_inconsistent_pandas_namespace(
+            content, path, replace=args.replace
+        )
+        if not args.replace:
             continue
-        if match.group(2) is not None:
-            raise AssertionError(
-                ERROR_MESSAGE.format(class_name=match.group(2).decode(), path=str(path))
-            )
-        if match.group(4) is not None:
-            raise AssertionError(
-                ERROR_MESSAGE.format(class_name=match.group(4).decode(), path=str(path))
-            )
+        with open(path, "w", encoding="utf-8") as fd:
+            fd.write(new_content)
 
 
 if __name__ == "__main__":
diff --git a/scripts/tests/test_inconsistent_namespace_check.py b/scripts/tests/test_inconsistent_namespace_check.py
index 37e6d288d9341..cc3509af5b138 100644
--- a/scripts/tests/test_inconsistent_namespace_check.py
+++ b/scripts/tests/test_inconsistent_namespace_check.py
@@ -1,28 +1,38 @@
-from pathlib import Path
-
 import pytest
 
-from scripts.check_for_inconsistent_pandas_namespace import main
+from scripts.check_for_inconsistent_pandas_namespace import (
+    check_for_inconsistent_pandas_namespace,
+)
 
 BAD_FILE_0 = "cat_0 = Categorical()\ncat_1 = pd.Categorical()"
 BAD_FILE_1 = "cat_0 = pd.Categorical()\ncat_1 = Categorical()"
 GOOD_FILE_0 = "cat_0 = Categorical()\ncat_1 = Categorical()"
 GOOD_FILE_1 = "cat_0 = pd.Categorical()\ncat_1 = pd.Categorical()"
+PATH = "t.py"
+
+
+@pytest.mark.parametrize("content", [BAD_FILE_0, BAD_FILE_1])
+def test_inconsistent_usage(content):
+    msg = r"Found both `pd\.Categorical` and `Categorical` in t\.py"
+    with pytest.raises(RuntimeError, match=msg):
+        check_for_inconsistent_pandas_namespace(content, PATH, replace=False)
+
+
+@pytest.mark.parametrize("content", [GOOD_FILE_0, GOOD_FILE_1])
+def test_consistent_usage(content):
+    # should not raise
+    check_for_inconsistent_pandas_namespace(content, PATH, replace=False)
 
 
 @pytest.mark.parametrize("content", [BAD_FILE_0, BAD_FILE_1])
-def test_inconsistent_usage(tmpdir, content):
-    tmpfile = Path(tmpdir / "tmpfile.py")
-    tmpfile.touch()
-    tmpfile.write_text(content)
-    msg = fr"Found both `pd\.Categorical` and `Categorical` in {str(tmpfile)}"
-    with pytest.raises(AssertionError, match=msg):
-        main((str(tmpfile),))
+def test_inconsistent_usage_with_replace(content):
+    result = check_for_inconsistent_pandas_namespace(content, PATH, replace=True)
+    expected = "cat_0 = Categorical()\ncat_1 = Categorical()"
+    assert result == expected
 
 
 @pytest.mark.parametrize("content", [GOOD_FILE_0, GOOD_FILE_1])
-def test_consistent_usage(tmpdir, content):
-    tmpfile = Path(tmpdir / "tmpfile.py")
-    tmpfile.touch()
-    tmpfile.write_text(content)
-    main((str(tmpfile),))  # Should not raise.
+def test_consistent_usage_with_replace(content):
+    result = check_for_inconsistent_pandas_namespace(content, PATH, replace=True)
+    expected = content
+    assert result == expected

From 65dbc19e691b0eec1fb6eb779b168202df76e16c Mon Sep 17 00:00:00 2001
From: Marco Gorelli <marcogorelli@protonmail.com>
Date: Tue, 9 Feb 2021 09:05:55 +0000
Subject: [PATCH 2/7] use Offset namedtuple

---
 scripts/check_for_inconsistent_pandas_namespace.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/scripts/check_for_inconsistent_pandas_namespace.py b/scripts/check_for_inconsistent_pandas_namespace.py
index e6774492eb267..372b7e1be9698 100644
--- a/scripts/check_for_inconsistent_pandas_namespace.py
+++ b/scripts/check_for_inconsistent_pandas_namespace.py
@@ -39,7 +39,7 @@ def visit_Attribute(self, node: ast.Attribute) -> None:
             and node.value.id == "pd"
             and node.attr not in EXCLUDE
         ):
-            self.pandas_namespace[(node.lineno, node.col_offset)] = node.attr
+            self.pandas_namespace[Offset(node.lineno, node.col_offset)] = node.attr
         self.generic_visit(node)
 
     def visit_Name(self, node: ast.Name):

From 285abca625f88bc634a57f04f04ac17efb79b4bf Mon Sep 17 00:00:00 2001
From: Marco Gorelli <marcogorelli@protonmail.com>
Date: Tue, 9 Feb 2021 09:08:52 +0000
Subject: [PATCH 3/7] strict typing

---
 scripts/check_for_inconsistent_pandas_namespace.py | 13 ++++++++-----
 1 file changed, 8 insertions(+), 5 deletions(-)

diff --git a/scripts/check_for_inconsistent_pandas_namespace.py b/scripts/check_for_inconsistent_pandas_namespace.py
index 372b7e1be9698..f80fac9b3fbab 100644
--- a/scripts/check_for_inconsistent_pandas_namespace.py
+++ b/scripts/check_for_inconsistent_pandas_namespace.py
@@ -29,7 +29,7 @@
 
 
 class Visitor(ast.NodeVisitor):
-    def __init__(self):
+    def __init__(self) -> None:
         self.pandas_namespace: MutableMapping[Offset, str] = {}
         self.no_namespace: Set[str] = set()
 
@@ -42,13 +42,15 @@ def visit_Attribute(self, node: ast.Attribute) -> None:
             self.pandas_namespace[Offset(node.lineno, node.col_offset)] = node.attr
         self.generic_visit(node)
 
-    def visit_Name(self, node: ast.Name):
+    def visit_Name(self, node: ast.Name) -> None:
         if node.id not in EXCLUDE:
             self.no_namespace.add(node.id)
         self.generic_visit(node)
 
 
-def check_for_inconsistent_pandas_namespace(content, path, *, replace):
+def check_for_inconsistent_pandas_namespace(
+    content: str, path: str, *, replace: bool
+) -> Optional[str]:
     tree = ast.parse(content)
 
     visitor = Visitor()
@@ -76,7 +78,8 @@ def check_for_inconsistent_pandas_namespace(content, path, *, replace):
             # Replace `.`
             tokens[n + 1] = i._replace(src="")
 
-    return tokens_to_src(tokens)
+    new_src: str = tokens_to_src(tokens)
+    return new_src
 
 
 def main(argv: Optional[Sequence[str]] = None) -> None:
@@ -91,7 +94,7 @@ def main(argv: Optional[Sequence[str]] = None) -> None:
         new_content = check_for_inconsistent_pandas_namespace(
             content, path, replace=args.replace
         )
-        if not args.replace:
+        if not args.replace or new_content is None:
             continue
         with open(path, "w", encoding="utf-8") as fd:
             fd.write(new_content)

From 1f6eba019e5ff271ac54bae27d51e977f512a85f Mon Sep 17 00:00:00 2001
From: MarcoGorelli <marcogorelli@protonmail.com>
Date: Wed, 10 Feb 2021 15:06:54 +0000
Subject: [PATCH 4/7] exclude array

---
 pandas/tests/frame/test_constructors.py            |  3 +--
 scripts/check_for_inconsistent_pandas_namespace.py | 10 +++++-----
 2 files changed, 6 insertions(+), 7 deletions(-)

diff --git a/pandas/tests/frame/test_constructors.py b/pandas/tests/frame/test_constructors.py
index 253f66d899193..aa83ec9a056bf 100644
--- a/pandas/tests/frame/test_constructors.py
+++ b/pandas/tests/frame/test_constructors.py
@@ -33,7 +33,6 @@
 )
 import pandas._testing as tm
 from pandas.arrays import IntervalArray, PeriodArray, SparseArray
-from pandas.core.construction import array as pd_array
 
 MIXED_FLOAT_DTYPES = ["float16", "float32", "float64"]
 MIXED_INT_DTYPES = [
@@ -754,7 +753,7 @@ def test_constructor_extension_scalar_data(self, data, dtype):
         assert df["a"].dtype == dtype
         assert df["b"].dtype == dtype
 
-        arr = pd_array([data] * 2, dtype=dtype)
+        arr = pd.array([data] * 2, dtype=dtype)
         expected = DataFrame({"a": arr, "b": arr})
 
         tm.assert_frame_equal(df, expected)
diff --git a/scripts/check_for_inconsistent_pandas_namespace.py b/scripts/check_for_inconsistent_pandas_namespace.py
index f80fac9b3fbab..ac71deb129d7e 100644
--- a/scripts/check_for_inconsistent_pandas_namespace.py
+++ b/scripts/check_for_inconsistent_pandas_namespace.py
@@ -23,8 +23,9 @@
 
 ERROR_MESSAGE = "Found both `pd.{name}` and `{name}` in {path}"
 EXCLUDE = {
+    "array",  # `import array` and `pd.array` should both be allowed
+    "eval",  # built-in, different from `pd.eval`
     "np",  # pd.np is deprecated but still tested
-    "eval",
 }
 
 
@@ -68,11 +69,10 @@ def check_for_inconsistent_pandas_namespace(
             and visitor.pandas_namespace[i.offset] in visitor.no_namespace
         ):
             if not replace:
-                raise RuntimeError(
-                    ERROR_MESSAGE.format(
-                        name=visitor.pandas_namespace[i.offset], path=path
-                    )
+                msg = ERROR_MESSAGE.format(
+                    name=visitor.pandas_namespace[i.offset], path=path
                 )
+                raise RuntimeError(msg)
             # Replace `pd`
             tokens[n] = i._replace(src="")
             # Replace `.`

From 02e89bd9d2413dc8b9e46b129fa9a56c067c22f1 Mon Sep 17 00:00:00 2001
From: MarcoGorelli <marcogorelli@protonmail.com>
Date: Tue, 16 Feb 2021 15:48:51 +0000
Subject: [PATCH 5/7] replace next token

---
 scripts/check_for_inconsistent_pandas_namespace.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/scripts/check_for_inconsistent_pandas_namespace.py b/scripts/check_for_inconsistent_pandas_namespace.py
index ac71deb129d7e..b644959157e11 100644
--- a/scripts/check_for_inconsistent_pandas_namespace.py
+++ b/scripts/check_for_inconsistent_pandas_namespace.py
@@ -76,7 +76,7 @@ def check_for_inconsistent_pandas_namespace(
             # Replace `pd`
             tokens[n] = i._replace(src="")
             # Replace `.`
-            tokens[n + 1] = i._replace(src="")
+            tokens[n + 1] = tokens[n+1]._replace(src="")
 
     new_src: str = tokens_to_src(tokens)
     return new_src

From a673ec2cad2dbeaa4c3cf732015caaa098bbb2f7 Mon Sep 17 00:00:00 2001
From: MarcoGorelli <marcogorelli@protonmail.com>
Date: Tue, 16 Feb 2021 15:56:53 +0000
Subject: [PATCH 6/7] fixup

---
 scripts/check_for_inconsistent_pandas_namespace.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/scripts/check_for_inconsistent_pandas_namespace.py b/scripts/check_for_inconsistent_pandas_namespace.py
index 6c28a7f11a233..8e87dbaef7ea9 100644
--- a/scripts/check_for_inconsistent_pandas_namespace.py
+++ b/scripts/check_for_inconsistent_pandas_namespace.py
@@ -86,7 +86,7 @@ def check_for_inconsistent_pandas_namespace(
             # Replace `pd`
             tokens[n] = i._replace(src="")
             # Replace `.`
-            tokens[n + 1] = tokens[n+1]._replace(src="")
+            tokens[n + 1] = tokens[n + 1]._replace(src="")
 
     new_src: str = tokens_to_src(tokens)
     return new_src

From a8854a2a8c25dfb932bae5a68fc21ce3cde5ba58 Mon Sep 17 00:00:00 2001
From: Marco Gorelli <marcogorelli@protonmail.com>
Date: Tue, 16 Feb 2021 20:44:32 +0000
Subject: [PATCH 7/7] don't require tokenize-rt for pre-commit hook

---
 .pre-commit-config.yaml                       |  1 -
 ...check_for_inconsistent_pandas_namespace.py | 54 +++++++++++--------
 2 files changed, 31 insertions(+), 24 deletions(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 93b48f11a5f94..d433fb08209bf 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -139,7 +139,6 @@ repos:
         language: python
         types: [python]
         files: ^pandas/tests/frame/
-        additional_dependencies: [tokenize-rt]
     -   id: FrameOrSeriesUnion
         name: Check for use of Union[Series, DataFrame] instead of FrameOrSeriesUnion alias
         entry: Union\[.*(Series,.*DataFrame|DataFrame,.*Series).*\]
diff --git a/scripts/check_for_inconsistent_pandas_namespace.py b/scripts/check_for_inconsistent_pandas_namespace.py
index ac71deb129d7e..f9d1d5fa3892c 100644
--- a/scripts/check_for_inconsistent_pandas_namespace.py
+++ b/scripts/check_for_inconsistent_pandas_namespace.py
@@ -12,14 +12,14 @@
 
     python scripts/check_for_inconsistent_pandas_namespace.py test_me.py --replace
 
-Note that you may need to manually fixup some imports.
+though note that you may need to manually fix up some imports and that you will also
+need the additional dependency `tokenize-rt` (which is left out of the pre-commit
+hook so that it uses the same virtualenv as the other local ones).
 """
 
 import argparse
 import ast
-from typing import MutableMapping, Optional, Sequence, Set
-
-from tokenize_rt import Offset, reversed_enumerate, src_to_tokens, tokens_to_src
+from typing import MutableMapping, Optional, Sequence, Set, Tuple
 
 ERROR_MESSAGE = "Found both `pd.{name}` and `{name}` in {path}"
 EXCLUDE = {
@@ -27,6 +27,7 @@
     "eval",  # built-in, different from `pd.eval`
     "np",  # pd.np is deprecated but still tested
 }
+Offset = Tuple[int, int]
 
 
 class Visitor(ast.NodeVisitor):
@@ -40,7 +41,7 @@ def visit_Attribute(self, node: ast.Attribute) -> None:
             and node.value.id == "pd"
             and node.attr not in EXCLUDE
         ):
-            self.pandas_namespace[Offset(node.lineno, node.col_offset)] = node.attr
+            self.pandas_namespace[(node.lineno, node.col_offset)] = node.attr
         self.generic_visit(node)
 
     def visit_Name(self, node: ast.Name) -> None:
@@ -49,39 +50,46 @@ def visit_Name(self, node: ast.Name) -> None:
         self.generic_visit(node)
 
 
-def check_for_inconsistent_pandas_namespace(
-    content: str, path: str, *, replace: bool
-) -> Optional[str]:
-    tree = ast.parse(content)
-
-    visitor = Visitor()
-    visitor.visit(tree)
+def replace_inconsistent_pandas_namespace(visitor: Visitor, content: str) -> str:
+    from tokenize_rt import reversed_enumerate, src_to_tokens, tokens_to_src
 
     tokens = src_to_tokens(content)
-
-    if not visitor.no_namespace.intersection(visitor.pandas_namespace.values()):
-        # No inconsistent namespace usage, nothing to replace.
-        return content
-
     for n, i in reversed_enumerate(tokens):
         if (
             i.offset in visitor.pandas_namespace
             and visitor.pandas_namespace[i.offset] in visitor.no_namespace
         ):
-            if not replace:
-                msg = ERROR_MESSAGE.format(
-                    name=visitor.pandas_namespace[i.offset], path=path
-                )
-                raise RuntimeError(msg)
             # Replace `pd`
             tokens[n] = i._replace(src="")
             # Replace `.`
-            tokens[n + 1] = i._replace(src="")
+            tokens[n + 1] = tokens[n + 1]._replace(src="")
 
     new_src: str = tokens_to_src(tokens)
     return new_src
 
 
+def check_for_inconsistent_pandas_namespace(
+    content: str, path: str, *, replace: bool
+) -> Optional[str]:
+    tree = ast.parse(content)
+
+    visitor = Visitor()
+    visitor.visit(tree)
+
+    inconsistencies = visitor.no_namespace.intersection(
+        visitor.pandas_namespace.values()
+    )
+    if not inconsistencies:
+        # No inconsistent namespace usage, nothing to replace.
+        return content
+
+    if not replace:
+        msg = ERROR_MESSAGE.format(name=inconsistencies.pop(), path=path)
+        raise RuntimeError(msg)
+
+    return replace_inconsistent_pandas_namespace(visitor, content)
+
+
 def main(argv: Optional[Sequence[str]] = None) -> None:
     parser = argparse.ArgumentParser()
     parser.add_argument("paths", nargs="*")