Skip to content

Backport PR #45706: BUG: Frame.iat item_cache invalidation bug #45744

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Merged
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions doc/source/whatsnew/v1.4.1.rst
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,7 @@ Fixed regressions
- Regression in :meth:`Series.mask` with ``inplace=True`` and ``PeriodDtype`` and an incompatible ``other`` coercing to a common dtype instead of raising (:issue:`45546`)
- Regression in :func:`.assert_frame_equal` not respecting ``check_flags=False`` (:issue:`45554`)
- Regression in :meth:`Series.fillna` with ``downcast=False`` incorrectly downcasting ``object`` dtype (:issue:`45603`)
- Regression in :meth:`DataFrame.iat` where values that were set did not propagate correctly to subsequent lookups (:issue:`45684`)
- Regression when setting values with :meth:`DataFrame.loc` losing :class:`Index` name if :class:`DataFrame` was empty before (:issue:`45621`)
- Regression in :meth:`~Index.join` with overlapping :class:`IntervalIndex` raising an ``InvalidIndexError`` (:issue:`45661`)
- Regression in :func:`read_sql` with a DBAPI2 connection that is not an instance of ``sqlite3.Connection`` incorrectly requiring SQLAlchemy be installed (:issue:`45660`)
Expand Down
8 changes: 8 additions & 0 deletions pandas/conftest.py
Original file line number Diff line number Diff line change
Expand Up @@ -1757,6 +1757,14 @@ def indexer_al(request):
return request.param


@pytest.fixture(params=[tm.iat, tm.iloc])
def indexer_ial(request):
    """
    Fixture parametrized over the two setter helpers ``tm.iat`` and
    ``tm.iloc`` (i.e. iat.__setitem__ and iloc.__setitem__).

    A test requesting this fixture runs once per helper and receives the
    helper itself.
    """
    indexer = request.param
    return indexer


@pytest.fixture
def using_array_manager(request):
"""
Expand Down
24 changes: 8 additions & 16 deletions pandas/core/frame.py
Original file line number Diff line number Diff line change
Expand Up @@ -93,7 +93,6 @@
)

from pandas.core.dtypes.cast import (
can_hold_element,
construct_1d_arraylike_from_scalar,
construct_2d_arraylike_from_scalar,
find_common_type,
Expand Down Expand Up @@ -3864,23 +3863,16 @@ def _set_value(
try:
if takeable:
series = self._ixs(col, axis=1)
series._set_value(index, value, takeable=True)
return

series = self._get_item_cache(col)
loc = self.index.get_loc(index)
dtype = series.dtype
if isinstance(dtype, np.dtype) and dtype.kind not in ["m", "M"]:
# otherwise we have EA values, and this check will be done
# via setitem_inplace
if not can_hold_element(series._values, value):
# We'll go through loc and end up casting.
raise TypeError
loc = index
else:
series = self._get_item_cache(col)
loc = self.index.get_loc(index)

# setitem_inplace will do validation that may raise TypeError
# or ValueError
series._mgr.setitem_inplace(loc, value)
# Note: trying to use series._set_value breaks tests in
# tests.frame.indexing.test_indexing and tests.indexing.test_partial
except (KeyError, TypeError):

except (KeyError, TypeError, ValueError):
# set using a non-recursive method & reset the cache
if takeable:
self.iloc[index, col] = value
Expand Down
15 changes: 14 additions & 1 deletion pandas/core/internals/base.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,14 +9,19 @@
final,
)

import numpy as np

from pandas._typing import (
ArrayLike,
DtypeObj,
Shape,
)
from pandas.errors import AbstractMethodError

from pandas.core.dtypes.cast import find_common_type
from pandas.core.dtypes.cast import (
find_common_type,
np_can_hold_element,
)

from pandas.core.base import PandasObject
from pandas.core.indexes.api import (
Expand Down Expand Up @@ -174,6 +179,14 @@ def setitem_inplace(self, indexer, value) -> None:
in place, not returning a new Manager (and Block), and thus never changing
the dtype.
"""
arr = self.array

# EAs will do this validation in their own __setitem__ methods.
if isinstance(arr, np.ndarray):
# Note: checking for ndarray instead of np.dtype means we exclude
# dt64/td64, which do their own validation.
value = np_can_hold_element(arr.dtype, value)

self.array[indexer] = value

def grouped_reduce(self, func, ignore_failures: bool = False):
Expand Down
17 changes: 17 additions & 0 deletions pandas/tests/indexing/test_iat.py
Original file line number Diff line number Diff line change
Expand Up @@ -29,3 +29,20 @@ def test_iat_getitem_series_with_period_index():
expected = ser[index[0]]
result = ser.iat[0]
assert expected == result


def test_iat_setitem_item_cache_cleared(indexer_ial):
    # GH#45684
    columns = {"x": np.arange(8, dtype=np.int64), "y": np.int64(0)}
    frame = DataFrame(columns).copy()
    # Fetch column "y" up front so the frame holds a cached Series for it.
    cached_y = frame["y"]

    # Setting into the first column used to split the block while leaving
    # the stale item_cache entry in place.
    indexer_ial(frame)[7, 0] = 9999

    indexer_ial(frame)[7, 1] = 1234

    # The second write has to be visible via iat, via the previously
    # fetched Series, and via iloc.
    assert frame.iat[7, 1] == 1234
    assert cached_y.iloc[-1] == 1234
    assert frame.iloc[-1, -1] == 1234