Make the C parser engine behave the same as the Python parser engine

kprestel · kprestel · commit 856753c4882b · 2018-12-01T13:26:19.000-05:00
diff --git a/pandas/_libs/parsers.pyx b/pandas/_libs/parsers.pyx
@@ -56,8 +56,10 @@ from pandas.core.arrays import Categorical
 from pandas.core.dtypes.concat import union_categoricals
 import pandas.io.common as icom
 
-from pandas.errors import (ParserError, DtypeWarning,
-                           EmptyDataError, ParserWarning)
+from pandas.errors import (
+    ParserError, DtypeWarning,
+    EmptyDataError, ParserWarning, AbstractMethodError,
+)
 
 # Import CParserError as alias of ParserError for backwards compatibility.
 # Ultimately, we want to remove this import. See gh-12665 and gh-14479.
@@ -1232,10 +1234,16 @@ cdef class TextReader:
             if result is not None and dtype != 'int64':
                 if is_extension_array_dtype(dtype):
                     try:
-                        result = dtype.construct_array_type()._from_sequence(
-                                result, dtype=dtype)
-                    except Exception as e:
-                        raise
+                        array_type = dtype.construct_array_type()
+                    except AttributeError:
+                        dtype = pandas_dtype(dtype)
+                        array_type = dtype.construct_array_type()
+                    try:
+                        # use _from_sequence_of_strings if the class defines it
+                        return array_type._from_sequence_of_strings(result,
+                                                                    dtype=dtype) # noqa
+                    except AbstractMethodError:
+                        return array_type._from_sequence(result, dtype=dtype)
                 else:
                     result = result.astype(dtype)
 
@@ -1248,14 +1256,19 @@ cdef class TextReader:
             if result is not None and dtype != 'float64':
                 if is_extension_array_dtype(dtype):
                     try:
-                        result = dtype.construct_array_type()._from_sequence(
-                                result)
-                    except Exception as e:
-                        raise
+                        array_type = dtype.construct_array_type()
+                    except AttributeError:
+                        dtype = pandas_dtype(dtype)
+                        array_type = dtype.construct_array_type()
+                    try:
+                        # use _from_sequence_of_strings if the class defines it
+                        return array_type._from_sequence_of_strings(result,
+                                                                    dtype=dtype) # noqa
+                    except AbstractMethodError:
+                        return array_type._from_sequence(result, dtype=dtype)
                 else:
                     result = result.astype(dtype)
             return result, na_count
-
         elif is_bool_dtype(dtype):
             result, na_count = _try_bool_flex(self.parser, i, start, end,
                                               na_filter, na_hashset,
diff --git a/pandas/core/series.py b/pandas/core/series.py
@@ -4354,7 +4354,8 @@ def _try_cast(arr, take_fast_path):
             subarr = np.array(data, copy=False)
 
             # possibility of nan -> garbage
-            if is_float_dtype(data.dtype) and is_integer_dtype(dtype):
+            if is_float_dtype(data.dtype) and is_integer_dtype(dtype) \
+                    and not is_extension_array_dtype(dtype):
                 if not isna(data).any():
                     subarr = _try_cast(data, True)
                 elif copy:
diff --git a/pandas/tests/extension/base/__init__.py b/pandas/tests/extension/base/__init__.py
@@ -52,3 +52,4 @@ class TestMyDtype(BaseDtypeTests):
 from .missing import BaseMissingTests  # noqa
 from .reshaping import BaseReshapingTests  # noqa
 from .setitem import BaseSetitemTests  # noqa
+from .io import ExtensionParsingTests  # noqa