pandas-dev · jreback · Jan 10, 2021 · Jan 9, 2021 · Jan 9, 2021 · Jan 9, 2021
diff --git a/doc/source/whatsnew/v1.2.1.rst b/doc/source/whatsnew/v1.2.1.rst
@@ -26,6 +26,7 @@ Fixed regressions
 - Bug in :meth:`read_csv` with ``float_precision="high"`` caused segfault or wrong parsing of long exponent strings. This resulted in a regression in some cases as the default for ``float_precision`` was changed in pandas 1.2.0 (:issue:`38753`)
 - Fixed regression in :meth:`Rolling.skew` and :meth:`Rolling.kurt` modifying the object inplace (:issue:`38908`)
 - Fixed regression in :meth:`read_csv` and other read functions where the encoding error policy (``errors``) did not default to ``"replace"`` when no encoding was specified (:issue:`38989`)
+- Fixed regression in :meth:`DataFrameGroupBy.diff` raising for ``int8`` and ``int16`` columns (:issue:`39050`)
 
 .. ---------------------------------------------------------------------------
 

diff --git a/pandas/core/algorithms.py b/pandas/core/algorithms.py
@@ -1991,7 +1991,11 @@ def diff(arr, n: int, axis: int = 0, stacklevel=3):
 
     elif is_integer_dtype(dtype):
         # We have to cast in order to be able to hold np.nan
-        dtype = np.float64
+        # int8/int16 input with float64 output raises NotImplementedError; use float32
 # Disable for unsupported dtype combinations, 
 #  see https://github.com/cython/cython/issues/2646 
 if (out_t is float32_t 
         and not (diff_t is float32_t or diff_t is int8_t or diff_t is int16_t)): 
     raise NotImplementedError 
 elif (out_t is float64_t 
       and (diff_t is float32_t or diff_t is int8_t or diff_t is int16_t)): 
     raise NotImplementedError 
 # Disable for unsupported dtype combinations, 
 #  see https://github.com/cython/cython/issues/2646 
 if (out_t is float32_t 
         and not (diff_t is float32_t or diff_t is int8_t or diff_t is int16_t)): 
     raise NotImplementedError 
 elif (out_t is float64_t 
       and (diff_t is float32_t or diff_t is int8_t or diff_t is int16_t)): 
     raise NotImplementedError 
+        if arr.dtype.name in ["int8", "int16"]:
+            dtype = np.float32
+        else:
+            dtype = np.float64
 
     orig_ndim = arr.ndim
     if orig_ndim == 1:

diff --git a/pandas/tests/test_algos.py b/pandas/tests/test_algos.py
@@ -2409,3 +2409,10 @@ def test_diff_ea_axis(self):
         msg = "cannot diff DatetimeArray on axis=1"
         with pytest.raises(ValueError, match=msg):
             algos.diff(dta, 1, axis=1)
+
+    @pytest.mark.parametrize("dtype", ["int8", "int16"])
+    def test_diff_low_precision_int(self, dtype):
+        arr = np.array([0, 1, 1, 0, 0], dtype=dtype)
+        result = algos.diff(arr, 1)
+        expected = np.array([np.nan, 1, 0, -1, 0], dtype="float32")
+        tm.assert_numpy_array_equal(result, expected)