|
| 1 | +from typing import TYPE_CHECKING, List, Tuple |
| 2 | + |
| 3 | +import numpy as np |
| 4 | + |
| 5 | +from pandas._typing import ArrayLike |
| 6 | + |
| 7 | +if TYPE_CHECKING: |
| 8 | + from pandas.core.internals.blocks import Block # noqa:F401 |
| 9 | + |
| 10 | + |
def operate_blockwise(left, right, array_op):
    """
    Apply a binary array operation block-by-block to two aligned frames.

    Parameters
    ----------
    left, right
        Objects exposing a block manager as ``_mgr``.  The caller is expected
        to have already verified ``right._indexed_same(left)``; that check is
        not repeated here.
    array_op : callable
        Called as ``array_op(lvals, rvals)`` on each pair of aligned value
        arrays.

    Returns
    -------
    A new manager of the same type as ``right._mgr``, built from the result
    blocks with ``right._mgr.axes`` and with the integrity check disabled.
    """
    # At this point we have already checked
    #  assert right._indexed_same(left)

    res_blks: List["Block"] = []
    rmgr = right._mgr
    for blk in left._mgr.blocks:
        locs = blk.mgr_locs
        blk_vals = blk.values

        # Anything that is not an ndarray is treated as an ExtensionArray.
        left_ea = not isinstance(blk_vals, np.ndarray)

        # Pieces of the right-hand manager at the positions held by ``blk``.
        rblks = rmgr._slice_take_blocks_ax0(locs.indexer, only_slice=True)

        # Assertions are disabled for performance, but should hold:
        # if left_ea:
        #    assert len(locs) == 1, locs
        #    assert len(rblks) == 1, rblks
        #    assert rblks[0].shape[0] == 1, rblks[0].shape

        for rblk in rblks:
            right_ea = not isinstance(rblk.values, np.ndarray)

            lvals, rvals = _get_same_shape_values(blk, rblk, left_ea, right_ea)

            res_values = array_op(lvals, rvals)
            if left_ea and not right_ea and hasattr(res_values, "reshape"):
                # The operands were squeezed for the op, but the result is
                # split via ``rblk`` (an ndarray block), so turn it back into
                # a single row first.
                res_values = res_values.reshape(1, -1)
            nbs = rblk._split_op_result(res_values)

            # Assertions are disabled for performance, but should hold:
            # if right_ea or left_ea:
            #    assert len(nbs) == 1
            # else:
            #    assert res_values.shape == lvals.shape, (res_values.shape, lvals.shape)

            # The new blocks are positioned relative to the slice taken from
            # ``rmgr``; map them back to positions in the original frame.
            _reset_block_mgr_locs(nbs, locs)

            res_blks.extend(nbs)

    # Assertions are disabled for performance, but should hold:
    #  slocs = {y for nb in res_blks for y in nb.mgr_locs.as_array}
    #  nlocs = sum(len(nb.mgr_locs.as_array) for nb in res_blks)
    #  assert nlocs == len(left.columns), (nlocs, len(left.columns))
    #  assert len(slocs) == nlocs, (len(slocs), nlocs)
    #  assert slocs == set(range(nlocs)), slocs

    new_mgr = type(rmgr)(res_blks, axes=rmgr.axes, do_integrity_check=False)
    return new_mgr
| 60 | + |
| 61 | + |
def _reset_block_mgr_locs(nbs: List["Block"], locs):
    """
    Point each block in ``nbs`` back at positions in the original DataFrame.

    Each block's current ``mgr_locs.indexer`` is used to index into
    ``locs.as_array``, and the selected positions are assigned back as the
    block's ``mgr_locs``.  The blocks are modified in place; nothing is
    returned.
    """
    for block in nbs:
        original_positions = locs.as_array
        relative_indexer = block.mgr_locs.indexer
        block.mgr_locs = original_positions[relative_indexer]
        # Assertions are disabled for performance, but should hold:
        #  assert len(block.mgr_locs) == block.shape[0]
        #  assert all(x in locs.as_array for x in block.mgr_locs.as_array)
| 72 | + |
| 73 | + |
def _get_same_shape_values(
    lblk: "Block", rblk: "Block", left_ea: bool, right_ea: bool
) -> Tuple[ArrayLike, ArrayLike]:
    """
    Return ``(lvals, rvals)`` from the two blocks, aligned for an array op.

    When the left values are not an extension array they are row-sliced with
    ``rblk.mgr_locs.indexer``.  When exactly one side is an extension array,
    the other side must have a single row, which is extracted so that both
    returned arrays line up.

    Raises
    ------
    AssertionError
        If ``rblk.mgr_locs`` is not slice-like, or if the shapes do not match
        the expectation for the given combination of flags.
    """
    left_values = lblk.values
    right_values = rblk.values

    placement = rblk.mgr_locs
    # Require that the indexing into the left values be slice-like
    assert placement.is_slice_like, placement

    # TODO(EA2D): with 2D EAs only the both-ndarray case would be needed
    if left_ea:
        if right_ea:
            # Both sides are extension arrays: shapes must already agree.
            assert left_values.shape == right_values.shape, (
                left_values.shape,
                right_values.shape,
            )
        else:
            # left values are 1D, right values are 2D with a single row
            assert right_values.shape[0] == 1, right_values.shape
            right_values = right_values[0, :]
    else:
        # Left is an ndarray block: keep only the rows that rblk covers.
        left_values = left_values[placement.indexer, :]
        if right_ea:
            # left values are 2D, right values are 1D
            assert left_values.shape[0] == 1, left_values.shape
            left_values = left_values[0, :]
        else:
            assert left_values.shape == right_values.shape, (
                left_values.shape,
                right_values.shape,
            )

    return left_values, right_values
0 commit comments