Skip to content

Commit 147d68a

Browse files
authored
TST/CLN: Remove makeTime methods (#56264)
* Remove makeTimeDataFrame * Remove getTimeSeriesData * Remove getCols * Remove makeCustomIndex usage * Fix tests
1 parent 958e7f5 commit 147d68a

34 files changed

+596
-200
lines changed

pandas/_testing/__init__.py

-19
Original file line number | Diff line number | Diff line change
@@ -6,7 +6,6 @@
66
import operator
77
import os
88
import re
9-
import string
109
from sys import byteorder
1110
from typing import (
1211
TYPE_CHECKING,
@@ -109,7 +108,6 @@
109108
from pandas.core.arrays import ArrowExtensionArray
110109

111110
_N = 30
112-
_K = 4
113111

114112
UNSIGNED_INT_NUMPY_DTYPES: list[NpDtype] = ["uint8", "uint16", "uint32", "uint64"]
115113
UNSIGNED_INT_EA_DTYPES: list[Dtype] = ["UInt8", "UInt16", "UInt32", "UInt64"]
@@ -341,10 +339,6 @@ def to_array(obj):
341339
# Others
342340

343341

344-
def getCols(k) -> str:
345-
return string.ascii_uppercase[:k]
346-
347-
348342
def makeTimeSeries(nper=None, freq: Frequency = "B", name=None) -> Series:
349343
if nper is None:
350344
nper = _N
@@ -355,16 +349,6 @@ def makeTimeSeries(nper=None, freq: Frequency = "B", name=None) -> Series:
355349
)
356350

357351

358-
def getTimeSeriesData(nper=None, freq: Frequency = "B") -> dict[str, Series]:
359-
return {c: makeTimeSeries(nper, freq) for c in getCols(_K)}
360-
361-
362-
# make frame
363-
def makeTimeDataFrame(nper=None, freq: Frequency = "B") -> DataFrame:
364-
data = getTimeSeriesData(nper, freq)
365-
return DataFrame(data)
366-
367-
368352
def makeCustomIndex(
369353
nentries,
370354
nlevels,
@@ -887,21 +871,18 @@ def shares_memory(left, right) -> bool:
887871
"external_error_raised",
888872
"FLOAT_EA_DTYPES",
889873
"FLOAT_NUMPY_DTYPES",
890-
"getCols",
891874
"get_cython_table_params",
892875
"get_dtype",
893876
"getitem",
894877
"get_locales",
895878
"get_finest_unit",
896879
"get_obj",
897880
"get_op_from_name",
898-
"getTimeSeriesData",
899881
"iat",
900882
"iloc",
901883
"loc",
902884
"makeCustomDataframe",
903885
"makeCustomIndex",
904-
"makeTimeDataFrame",
905886
"makeTimeSeries",
906887
"maybe_produces_warning",
907888
"NARROW_NP_DTYPES",

pandas/conftest.py

+5-1
Original file line number | Diff line number | Diff line change
@@ -550,7 +550,11 @@ def multiindex_year_month_day_dataframe_random_data():
550550
DataFrame with 3 level MultiIndex (year, month, day) covering
551551
first 100 business days from 2000-01-01 with random data
552552
"""
553-
tdf = tm.makeTimeDataFrame(100)
553+
tdf = DataFrame(
554+
np.random.default_rng(2).standard_normal((100, 4)),
555+
columns=Index(list("ABCD"), dtype=object),
556+
index=date_range("2000-01-01", periods=100, freq="B"),
557+
)
554558
ymd = tdf.groupby([lambda x: x.year, lambda x: x.month, lambda x: x.day]).sum()
555559
# use int64 Index, to make sure things work
556560
ymd.index = ymd.index.set_levels([lev.astype("i8") for lev in ymd.index.levels])

pandas/tests/frame/conftest.py

+5-21
Original file line number | Diff line number | Diff line change
@@ -7,7 +7,6 @@
77
NaT,
88
date_range,
99
)
10-
import pandas._testing as tm
1110

1211

1312
@pytest.fixture
@@ -16,27 +15,12 @@ def datetime_frame() -> DataFrame:
1615
Fixture for DataFrame of floats with DatetimeIndex
1716
1817
Columns are ['A', 'B', 'C', 'D']
19-
20-
A B C D
21-
2000-01-03 -1.122153 0.468535 0.122226 1.693711
22-
2000-01-04 0.189378 0.486100 0.007864 -1.216052
23-
2000-01-05 0.041401 -0.835752 -0.035279 -0.414357
24-
2000-01-06 0.430050 0.894352 0.090719 0.036939
25-
2000-01-07 -0.620982 -0.668211 -0.706153 1.466335
26-
2000-01-10 -0.752633 0.328434 -0.815325 0.699674
27-
2000-01-11 -2.236969 0.615737 -0.829076 -1.196106
28-
... ... ... ... ...
29-
2000-02-03 1.642618 -0.579288 0.046005 1.385249
30-
2000-02-04 -0.544873 -1.160962 -0.284071 -1.418351
31-
2000-02-07 -2.656149 -0.601387 1.410148 0.444150
32-
2000-02-08 -1.201881 -1.289040 0.772992 -1.445300
33-
2000-02-09 1.377373 0.398619 1.008453 -0.928207
34-
2000-02-10 0.473194 -0.636677 0.984058 0.511519
35-
2000-02-11 -0.965556 0.408313 -1.312844 -0.381948
36-
37-
[30 rows x 4 columns]
3818
"""
39-
return DataFrame(tm.getTimeSeriesData())
19+
return DataFrame(
20+
np.random.default_rng(2).standard_normal((100, 4)),
21+
columns=Index(list("ABCD"), dtype=object),
22+
index=date_range("2000-01-01", periods=100, freq="B"),
23+
)
4024

4125

4226
@pytest.fixture

pandas/tests/frame/indexing/test_indexing.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -584,7 +584,7 @@ def test_fancy_getitem_slice_mixed(
584584
tm.assert_frame_equal(float_frame, original)
585585

586586
def test_getitem_setitem_non_ix_labels(self):
587-
df = tm.makeTimeDataFrame()
587+
df = DataFrame(range(20), index=date_range("2020-01-01", periods=20))
588588

589589
start, end = df.index[[5, 10]]
590590

pandas/tests/frame/methods/test_cov_corr.py

+8-2
Original file line number | Diff line number | Diff line change
@@ -6,7 +6,9 @@
66
import pandas as pd
77
from pandas import (
88
DataFrame,
9+
Index,
910
Series,
11+
date_range,
1012
isna,
1113
)
1214
import pandas._testing as tm
@@ -325,8 +327,12 @@ def test_corrwith(self, datetime_frame, dtype):
325327
tm.assert_almost_equal(correls[row], df1.loc[row].corr(df2.loc[row]))
326328

327329
def test_corrwith_with_objects(self):
328-
df1 = tm.makeTimeDataFrame()
329-
df2 = tm.makeTimeDataFrame()
330+
df1 = DataFrame(
331+
np.random.default_rng(2).standard_normal((10, 4)),
332+
columns=Index(list("ABCD"), dtype=object),
333+
index=date_range("2000-01-01", periods=10, freq="B"),
334+
)
335+
df2 = df1.copy()
330336
cols = ["A", "B", "C", "D"]
331337

332338
df1["obj"] = "foo"

pandas/tests/frame/methods/test_first_and_last.py

+23-4
Original file line number | Diff line number | Diff line change
@@ -1,12 +1,15 @@
11
"""
22
Note: includes tests for `last`
33
"""
4+
import numpy as np
45
import pytest
56

67
import pandas as pd
78
from pandas import (
89
DataFrame,
10+
Index,
911
bdate_range,
12+
date_range,
1013
)
1114
import pandas._testing as tm
1215

@@ -16,13 +19,21 @@
1619

1720
class TestFirst:
1821
def test_first_subset(self, frame_or_series):
19-
ts = tm.makeTimeDataFrame(freq="12h")
22+
ts = DataFrame(
23+
np.random.default_rng(2).standard_normal((100, 4)),
24+
columns=Index(list("ABCD"), dtype=object),
25+
index=date_range("2000-01-01", periods=100, freq="12h"),
26+
)
2027
ts = tm.get_obj(ts, frame_or_series)
2128
with tm.assert_produces_warning(FutureWarning, match=deprecated_msg):
2229
result = ts.first("10d")
2330
assert len(result) == 20
2431

25-
ts = tm.makeTimeDataFrame(freq="D")
32+
ts = DataFrame(
33+
np.random.default_rng(2).standard_normal((100, 4)),
34+
columns=Index(list("ABCD"), dtype=object),
35+
index=date_range("2000-01-01", periods=100, freq="D"),
36+
)
2637
ts = tm.get_obj(ts, frame_or_series)
2738
with tm.assert_produces_warning(FutureWarning, match=deprecated_msg):
2839
result = ts.first("10d")
@@ -64,13 +75,21 @@ def test_first_last_raises(self, frame_or_series):
6475
obj.last("1D")
6576

6677
def test_last_subset(self, frame_or_series):
67-
ts = tm.makeTimeDataFrame(freq="12h")
78+
ts = DataFrame(
79+
np.random.default_rng(2).standard_normal((100, 4)),
80+
columns=Index(list("ABCD"), dtype=object),
81+
index=date_range("2000-01-01", periods=100, freq="12h"),
82+
)
6883
ts = tm.get_obj(ts, frame_or_series)
6984
with tm.assert_produces_warning(FutureWarning, match=last_deprecated_msg):
7085
result = ts.last("10d")
7186
assert len(result) == 20
7287

73-
ts = tm.makeTimeDataFrame(nper=30, freq="D")
88+
ts = DataFrame(
89+
np.random.default_rng(2).standard_normal((30, 4)),
90+
columns=Index(list("ABCD"), dtype=object),
91+
index=date_range("2000-01-01", periods=30, freq="D"),
92+
)
7493
ts = tm.get_obj(ts, frame_or_series)
7594
with tm.assert_produces_warning(FutureWarning, match=last_deprecated_msg):
7695
result = ts.last("10d")

pandas/tests/frame/methods/test_truncate.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -60,7 +60,7 @@ def test_truncate(self, datetime_frame, frame_or_series):
6060
truncated = ts.truncate(before=ts.index[-1] + ts.index.freq)
6161
assert len(truncated) == 0
6262

63-
msg = "Truncate: 2000-01-06 00:00:00 must be after 2000-02-04 00:00:00"
63+
msg = "Truncate: 2000-01-06 00:00:00 must be after 2000-05-16 00:00:00"
6464
with pytest.raises(ValueError, match=msg):
6565
ts.truncate(
6666
before=ts.index[-1] - ts.index.freq, after=ts.index[0] + ts.index.freq

pandas/tests/frame/test_arithmetic.py

+6-2
Original file line number | Diff line number | Diff line change
@@ -1523,8 +1523,12 @@ def test_combineFunc(self, float_frame, mixed_float_frame):
15231523
[operator.eq, operator.ne, operator.lt, operator.gt, operator.ge, operator.le],
15241524
)
15251525
def test_comparisons(self, simple_frame, float_frame, func):
1526-
df1 = tm.makeTimeDataFrame()
1527-
df2 = tm.makeTimeDataFrame()
1526+
df1 = DataFrame(
1527+
np.random.default_rng(2).standard_normal((30, 4)),
1528+
columns=Index(list("ABCD"), dtype=object),
1529+
index=pd.date_range("2000-01-01", periods=30, freq="B"),
1530+
)
1531+
df2 = df1.copy()
15281532

15291533
row = simple_frame.xs("a")
15301534
ndim_5 = np.ones(df1.shape + (1, 1, 1))

pandas/tests/generic/test_generic.py

+39-9
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,9 @@
1010

1111
from pandas import (
1212
DataFrame,
13+
Index,
1314
Series,
15+
date_range,
1416
)
1517
import pandas._testing as tm
1618

@@ -328,12 +330,16 @@ def test_squeeze_series_noop(self, ser):
328330

329331
def test_squeeze_frame_noop(self):
330332
# noop
331-
df = tm.makeTimeDataFrame()
333+
df = DataFrame(np.eye(2))
332334
tm.assert_frame_equal(df.squeeze(), df)
333335

334336
def test_squeeze_frame_reindex(self):
335337
# squeezing
336-
df = tm.makeTimeDataFrame().reindex(columns=["A"])
338+
df = DataFrame(
339+
np.random.default_rng(2).standard_normal((10, 4)),
340+
columns=Index(list("ABCD"), dtype=object),
341+
index=date_range("2000-01-01", periods=10, freq="B"),
342+
).reindex(columns=["A"])
337343
tm.assert_series_equal(df.squeeze(), df["A"])
338344

339345
def test_squeeze_0_len_dim(self):
@@ -345,7 +351,11 @@ def test_squeeze_0_len_dim(self):
345351

346352
def test_squeeze_axis(self):
347353
# axis argument
348-
df = tm.makeTimeDataFrame(nper=1).iloc[:, :1]
354+
df = DataFrame(
355+
np.random.default_rng(2).standard_normal((1, 4)),
356+
columns=Index(list("ABCD"), dtype=object),
357+
index=date_range("2000-01-01", periods=1, freq="B"),
358+
).iloc[:, :1]
349359
assert df.shape == (1, 1)
350360
tm.assert_series_equal(df.squeeze(axis=0), df.iloc[0])
351361
tm.assert_series_equal(df.squeeze(axis="index"), df.iloc[0])
@@ -360,14 +370,22 @@ def test_squeeze_axis(self):
360370
df.squeeze(axis="x")
361371

362372
def test_squeeze_axis_len_3(self):
363-
df = tm.makeTimeDataFrame(3)
373+
df = DataFrame(
374+
np.random.default_rng(2).standard_normal((3, 4)),
375+
columns=Index(list("ABCD"), dtype=object),
376+
index=date_range("2000-01-01", periods=3, freq="B"),
377+
)
364378
tm.assert_frame_equal(df.squeeze(axis=0), df)
365379

366380
def test_numpy_squeeze(self):
367381
s = Series(range(2), dtype=np.float64)
368382
tm.assert_series_equal(np.squeeze(s), s)
369383

370-
df = tm.makeTimeDataFrame().reindex(columns=["A"])
384+
df = DataFrame(
385+
np.random.default_rng(2).standard_normal((10, 4)),
386+
columns=Index(list("ABCD"), dtype=object),
387+
index=date_range("2000-01-01", periods=10, freq="B"),
388+
).reindex(columns=["A"])
371389
tm.assert_series_equal(np.squeeze(df), df["A"])
372390

373391
@pytest.mark.parametrize(
@@ -382,11 +400,19 @@ def test_transpose_series(self, ser):
382400
tm.assert_series_equal(ser.transpose(), ser)
383401

384402
def test_transpose_frame(self):
385-
df = tm.makeTimeDataFrame()
403+
df = DataFrame(
404+
np.random.default_rng(2).standard_normal((10, 4)),
405+
columns=Index(list("ABCD"), dtype=object),
406+
index=date_range("2000-01-01", periods=10, freq="B"),
407+
)
386408
tm.assert_frame_equal(df.transpose().transpose(), df)
387409

388410
def test_numpy_transpose(self, frame_or_series):
389-
obj = tm.makeTimeDataFrame()
411+
obj = DataFrame(
412+
np.random.default_rng(2).standard_normal((10, 4)),
413+
columns=Index(list("ABCD"), dtype=object),
414+
index=date_range("2000-01-01", periods=10, freq="B"),
415+
)
390416
obj = tm.get_obj(obj, frame_or_series)
391417

392418
if frame_or_series is Series:
@@ -419,7 +445,11 @@ def test_take_series(self, ser):
419445

420446
def test_take_frame(self):
421447
indices = [1, 5, -2, 6, 3, -1]
422-
df = tm.makeTimeDataFrame()
448+
df = DataFrame(
449+
np.random.default_rng(2).standard_normal((10, 4)),
450+
columns=Index(list("ABCD"), dtype=object),
451+
index=date_range("2000-01-01", periods=10, freq="B"),
452+
)
423453
out = df.take(indices)
424454
expected = DataFrame(
425455
data=df.values.take(indices, axis=0),
@@ -431,7 +461,7 @@ def test_take_frame(self):
431461
def test_take_invalid_kwargs(self, frame_or_series):
432462
indices = [-3, 2, 0, 1]
433463

434-
obj = tm.makeTimeDataFrame()
464+
obj = DataFrame(range(5))
435465
obj = tm.get_obj(obj, frame_or_series)
436466

437467
msg = r"take\(\) got an unexpected keyword argument 'foo'"

pandas/tests/groupby/aggregate/test_aggregate.py

+5-1
Original file line number | Diff line number | Diff line change
@@ -161,7 +161,11 @@ def test_agg_apply_corner(ts, tsframe):
161161

162162

163163
def test_agg_grouping_is_list_tuple(ts):
164-
df = tm.makeTimeDataFrame()
164+
df = DataFrame(
165+
np.random.default_rng(2).standard_normal((30, 4)),
166+
columns=Index(list("ABCD"), dtype=object),
167+
index=pd.date_range("2000-01-01", periods=30, freq="B"),
168+
)
165169

166170
grouped = df.groupby(lambda x: x.year)
167171
grouper = grouped.grouper.groupings[0].grouping_vector

pandas/tests/groupby/conftest.py

+10-2
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,11 @@
11
import numpy as np
22
import pytest
33

4-
from pandas import DataFrame
4+
from pandas import (
5+
DataFrame,
6+
Index,
7+
date_range,
8+
)
59
import pandas._testing as tm
610
from pandas.core.groupby.base import (
711
reduction_kernels,
@@ -48,7 +52,11 @@ def ts():
4852

4953
@pytest.fixture
5054
def tsframe():
51-
return DataFrame(tm.getTimeSeriesData())
55+
return DataFrame(
56+
np.random.default_rng(2).standard_normal((30, 4)),
57+
columns=Index(list("ABCD"), dtype=object),
58+
index=date_range("2000-01-01", periods=30, freq="B"),
59+
)
5260

5361

5462
@pytest.fixture

0 commit comments

Comments
 (0)