|
| 1 | +import numpy as np |
| 2 | +import pytest |
| 3 | + |
| 4 | +from pandas import ( |
| 5 | + PeriodIndex, |
| 6 | + Series, |
| 7 | + date_range, |
| 8 | + period_range, |
| 9 | + timedelta_range, |
| 10 | +) |
| 11 | +import pandas._testing as tm |
| 12 | + |
| 13 | + |
class DropDuplicates:
    """Shared ``drop_duplicates`` / ``duplicated`` checks.

    The class name has no ``Test`` prefix; concrete subclasses provide the
    ``idx`` fixture (a 10-element index named "idx") that every test here
    consumes.
    """

    def test_drop_duplicates_metadata(self, idx):
        """Check values and ``freq`` after de-duplicating ``idx`` and ``idx + idx``."""
        # GH#10115
        deduped = idx.drop_duplicates()
        tm.assert_index_equal(idx, deduped)
        assert idx.freq == deduped.freq

        doubled = idx.append(idx)
        deduped = doubled.drop_duplicates()

        if isinstance(idx, PeriodIndex):
            # PeriodIndex is the one case where freq is kept
            expected = idx
            assert deduped.freq == expected.freq
        else:
            # freq is reset except for PeriodIndex
            assert doubled.freq is None
            assert deduped.freq is None
            expected = idx._with_freq(None)

        tm.assert_index_equal(deduped, expected)

    @pytest.mark.parametrize(
        "keep, expected, index",
        [
            ("first", np.repeat([False, True], [10, 5]), np.arange(10)),
            ("last", np.repeat([True, False], [5, 10]), np.arange(5, 15)),
            (False, np.repeat([True, False, True], 5), np.arange(5, 10)),
        ],
    )
    def test_drop_duplicates(self, keep, expected, index, idx):
        """Check ``duplicated`` and ``drop_duplicates`` on both Index and Series.

        ``expected`` is the boolean duplicate mask for the 15-element index
        built below; ``index`` holds the positions that survive in the
        Series result.
        """
        # to check Index/Series compat
        with_repeats = idx.append(idx[:5])

        dup_mask = with_repeats.duplicated(keep=keep)
        tm.assert_numpy_array_equal(dup_mask, expected)

        survivors = with_repeats[~expected]

        index_result = with_repeats.drop_duplicates(keep=keep)
        tm.assert_index_equal(index_result, survivors)

        series_result = Series(with_repeats).drop_duplicates(keep=keep)
        tm.assert_series_equal(series_result, Series(survivors, index=index))
| 59 | + |
| 60 | + |
class TestDropDuplicatesPeriodIndex(DropDuplicates):
    """Run the shared ``DropDuplicates`` checks against a ``PeriodIndex``."""

    # Lower-case "h"/"min"/"s" replace the upper-case "H"/"T"/"S" aliases,
    # which pandas deprecated in 2.2.
    @pytest.fixture(params=["D", "3D", "h", "2h", "min", "2min", "s", "3s"])
    def freq(self, request):
        """Frequency string used to build the period index under test."""
        return request.param

    @pytest.fixture
    def idx(self, freq):
        """Ten consecutive periods starting 2011-01-01, named "idx"."""
        return period_range("2011-01-01", periods=10, freq=freq, name="idx")
| 69 | + |
| 70 | + |
class TestDropDuplicatesDatetimeIndex(DropDuplicates):
    """Run the shared ``DropDuplicates`` checks against a ``DatetimeIndex``."""

    @pytest.fixture
    def idx(self, freq_sample):
        """Ten timestamps starting 2011-01-01, named "idx".

        ``freq_sample`` is a fixture that is not defined in this file.
        """
        datetime_idx = date_range(
            "2011-01-01",
            periods=10,
            freq=freq_sample,
            name="idx",
        )
        return datetime_idx
| 75 | + |
| 76 | + |
class TestDropDuplicatesTimedeltaIndex(DropDuplicates):
    """Run the shared ``DropDuplicates`` checks against a ``TimedeltaIndex``."""

    @pytest.fixture
    def idx(self, freq_sample):
        """Ten timedeltas starting at "1 day", named "idx".

        ``freq_sample`` is a fixture that is not defined in this file.
        """
        timedelta_idx = timedelta_range(
            "1 day",
            freq=freq_sample,
            periods=10,
            name="idx",
        )
        return timedelta_idx
0 commit comments