TST: do not skip a test when fewer than all readers are installed

davidovitch · davidovitch · commit 3dc73bfb70d6 · 2015-03-15T18:38:44.000+01:00
diff --git a/pandas/io/tests/test_excel.py b/pandas/io/tests/test_excel.py
@@ -60,7 +60,7 @@ def _skip_if_no_xlsxwriter():
 
 def _skip_if_no_ezodf():
     try:
-        import ezodf
+        import ezodf  # NOQA
     except ImportError:
         raise nose.SkipTest('ezodf not installed, skipping')
 
@@ -94,6 +94,27 @@ def setUp(self):
         self.frame2 = _frame2.copy()
         self.tsframe = _tsframe.copy()
         self.mixed_frame = _mixed_frame.copy()
+        self.readers2test()
+
+    def readers2test(self):
+        self.suffix2test = []
+        try:
+            _skip_if_no_ezodf()
+            self.suffix2test.append('ods')
+        except nose.SkipTest:
+            pass
+        try:
+            _skip_if_no_xlrd()
+            self.suffix2test.append('xls')
+        except nose.SkipTest:
+            pass
+        try:
+            _skip_if_no_openpyxl()
+            self.suffix2test.append('xlsm')
+            self.suffix2test.append('xlsx')
+        except nose.SkipTest:
+            pass
+        self.suffix2test = frozenset(self.suffix2test)
 
     def read_csv(self, *args, **kwds):
         kwds = kwds.copy()
@@ -103,11 +124,10 @@ def read_csv(self, *args, **kwds):
 
 class ExcelReaderTests(SharedItems, tm.TestCase):
     def test_parse_cols_int(self):
-        _skip_if_no_openpyxl()
-        _skip_if_no_xlrd()
-        _skip_if_no_ezodf()
 
-        suffix = ['xls', 'xlsx', 'xlsm', 'ods']
+        suffix = set(['xls', 'xlsx', 'xlsm', 'ods']) & self.suffix2test
+        if len(suffix) < 1:
+            raise nose.SkipTest('no spreadsheet readers installed, skipping')
 
         for s in suffix:
             pth = os.path.join(self.dirpath, 'test.%s' % s)
@@ -123,11 +143,10 @@ def test_parse_cols_int(self):
             tm.assert_frame_equal(df3, df2, check_names=False)
 
     def test_parse_cols_list(self):
-        _skip_if_no_openpyxl()
-        _skip_if_no_xlrd()
-        _skip_if_no_ezodf()
 
-        suffix = ['xls', 'xlsx', 'xlsm', 'ods']
+        suffix = set(['xls', 'xlsx', 'xlsm', 'ods']) & self.suffix2test
+        if len(suffix) < 1:
+            raise nose.SkipTest('no spreadsheet readers installed, skipping')
 
         for s in suffix:
             pth = os.path.join(self.dirpath, 'test.%s' % s)
@@ -144,11 +163,10 @@ def test_parse_cols_list(self):
             tm.assert_frame_equal(df3, df2, check_names=False)
 
     def test_parse_cols_str(self):
-        _skip_if_no_openpyxl()
-        _skip_if_no_xlrd()
-        _skip_if_no_ezodf()
 
-        suffix = ['xls', 'xlsx', 'xlsm', 'ods']
+        suffix = set(['xls', 'xlsx', 'xlsm', 'ods']) & self.suffix2test
+        if len(suffix) < 1:
+            raise nose.SkipTest('no spreadsheet readers installed, skipping')
 
         for s in suffix:
 
@@ -189,10 +207,9 @@ def test_parse_cols_str(self):
             tm.assert_frame_equal(df3, df2, check_names=False)
 
     def test_excel_stop_iterator(self):
-        _skip_if_no_xlrd()
-        _skip_if_no_ezodf()
-
-        suffix = ['xls', 'ods']
+        suffix = set(['xls', 'ods']) & self.suffix2test
+        if len(suffix) < 1:
+            raise nose.SkipTest('no spreadsheet readers installed, skipping')
 
         for s in suffix:
             excel_data = ExcelFile(os.path.join(self.dirpath, 'test2.%s' % s))
@@ -201,28 +218,34 @@ def test_excel_stop_iterator(self):
             tm.assert_frame_equal(parsed, expected)
 
     def test_excel_cell_error_na(self):
-        _skip_if_no_xlrd()
+        suffix = set(['xls', 'ods']) & self.suffix2test
+        if len(suffix) < 1:
+            raise nose.SkipTest('no spreadsheet readers installed, skipping')
 
-        excel_data = ExcelFile(os.path.join(self.dirpath, 'test3.xls'))
-        parsed = excel_data.parse('Sheet1')
-        expected = DataFrame([[np.nan]], columns=['Test'])
-        tm.assert_frame_equal(parsed, expected)
+        for s in suffix:
+            excel_data = ExcelFile(os.path.join(self.dirpath, 'test3.%s' % s))
+            parsed = excel_data.parse('Sheet1')
+            expected = DataFrame([[np.nan]], columns=['Test'])
+            tm.assert_frame_equal(parsed, expected)
 
     def test_excel_passes_na(self):
-        _skip_if_no_xlrd()
+        suffix = set(['xlsx', 'ods']) & self.suffix2test
+        if len(suffix) < 1:
+            raise nose.SkipTest('no spreadsheet readers installed, skipping')
 
-        excel_data = ExcelFile(os.path.join(self.dirpath, 'test2.xlsx'))
-        parsed = excel_data.parse('Sheet1', keep_default_na=False,
-                                  na_values=['apple'])
-        expected = DataFrame([['NA'], [1], ['NA'], [np.nan], ['rabbit']],
-                             columns=['Test'])
-        tm.assert_frame_equal(parsed, expected)
+        for s in suffix:
+            excel_data = ExcelFile(os.path.join(self.dirpath, 'test4.%s' % s))
+            parsed = excel_data.parse('Sheet1', keep_default_na=False,
+                                      na_values=['apple'])
+            expected = DataFrame([['NA'], [1], ['NA'], [np.nan], ['rabbit']],
+                                 columns=['Test'])
+            tm.assert_frame_equal(parsed, expected)
 
-        parsed = excel_data.parse('Sheet1', keep_default_na=True,
-                                  na_values=['apple'])
-        expected = DataFrame([[np.nan], [1], [np.nan], [np.nan], ['rabbit']],
-                             columns=['Test'])
-        tm.assert_frame_equal(parsed, expected)
+            parsed = excel_data.parse('Sheet1', keep_default_na=True,
+                                      na_values=['apple'])
+            expected = DataFrame([[np.nan], [1], [np.nan], [np.nan], ['rabbit']],
+                                 columns=['Test'])
+            tm.assert_frame_equal(parsed, expected)
 
     def check_excel_table_sheet_by_index(self, filename, csvfile):
 
@@ -255,11 +278,9 @@ def test_excel_table_sheet_by_index(self):
             self.check_excel_table_sheet_by_index(filename, csvfile)
 
     def test_excel_table(self):
-        _skip_if_no_xlrd()
-        _skip_if_no_openpyxl()
-        _skip_if_no_ezodf()
-
-        suffix = ['xls', 'xlsx', 'ods']
+        suffix = set(['xls', 'xlsx', 'ods']) & self.suffix2test
+        if len(suffix) < 1:
+            raise nose.SkipTest('no spreadsheet readers installed, skipping')
 
         for s in suffix:
 
@@ -281,19 +302,16 @@ def test_excel_table(self):
             tm.assert_frame_equal(df4, df5)
 
     def test_excel_read_buffer(self):
-        _skip_if_no_xlrd()
-        _skip_if_no_openpyxl()
+        suffix = set(['xls', 'xlsx']) & self.suffix2test
+        if len(suffix) < 1:
+            raise nose.SkipTest('no spreadsheet readers installed, skipping')
 
-        pth = os.path.join(self.dirpath, 'test.xls')
-        f = open(pth, 'rb')
-        xls = ExcelFile(f)
-        # it works
-        xls.parse('Sheet1', index_col=0, parse_dates=True)
-
-        pth = os.path.join(self.dirpath, 'test.xlsx')
-        f = open(pth, 'rb')
-        xl = ExcelFile(f)
-        xl.parse('Sheet1', index_col=0, parse_dates=True)
+        for s in suffix:
+            pth = os.path.join(self.dirpath, 'test.%s' % s)
+            f = open(pth, 'rb')
+            xls = ExcelFile(f)
+            # it works
+            xls.parse('Sheet1', index_col=0, parse_dates=True)
 
     def test_read_xlrd_Book(self):
         _skip_if_no_xlrd()
@@ -380,9 +398,10 @@ def test_reader_closes_file(self):
         self.assertTrue(f.closed)
 
     def test_reader_special_dtypes(self):
-        _skip_if_no_xlrd()
-        _skip_if_no_openpyxl()
-        _skip_if_no_ezodf()
+
+        suffix = set(['xls', 'xlsx', 'ods']) & self.suffix2test
+        if len(suffix) < 1:
+            raise nose.SkipTest('no spreadsheet readers installed, skipping')
 
         expected = DataFrame.from_items([
             ("IntCol", [1, 2, -3, 4, 0]),
@@ -396,49 +415,50 @@ def test_reader_special_dtypes(self):
                          datetime(2015, 3, 14)])
         ])
 
-        xlsx_path = os.path.join(self.dirpath, 'test_types.xlsx')
-        xls_path = os.path.join(self.dirpath, 'test_types.xls')
-        ods_path = os.path.join(self.dirpath, 'test_types.ods')
-
         # should read in correctly and infer types
-        for path in (xls_path, xlsx_path, ods_path):
+        for s in suffix:
+            path = os.path.join(self.dirpath, 'test_types.%s' %s)
             actual = read_excel(path, 'Sheet1')
             tm.assert_frame_equal(actual, expected)
 
         # if not coercing number, then int comes in as float
         float_expected = expected.copy()
         float_expected["IntCol"] = float_expected["IntCol"].astype(float)
         float_expected.loc[1, "Str2Col"] = 3.0
-        for path in (xls_path, xlsx_path, ods_path):
+        for s in suffix:
+            path = os.path.join(self.dirpath, 'test_types.%s' %s)
             actual = read_excel(path, 'Sheet1', convert_float=False)
             tm.assert_frame_equal(actual, float_expected)
 
         # check setting Index (assuming xls and xlsx are the same here)
-        for icol, name in enumerate(expected.columns):
-            actual = read_excel(xlsx_path, 'Sheet1', index_col=icol)
-            actual2 = read_excel(xlsx_path, 'Sheet1', index_col=name)
-            actual3 = read_excel(ods_path, 'Sheet1', index_col=name)
-            exp = expected.set_index(name)
-            tm.assert_frame_equal(actual, exp)
-            tm.assert_frame_equal(actual2, exp)
-            tm.assert_frame_equal(actual3, exp)
+        for s in suffix:
+            path = os.path.join(self.dirpath, 'test_types.%s' %s)
+            for icol, name in enumerate(expected.columns):
+                actual = read_excel(path, 'Sheet1', index_col=icol)
+                exp = expected.set_index(name)
+                tm.assert_frame_equal(actual, exp)
 
         # convert_float and converters should be different but both accepted
-        expected["StrCol"] = expected["StrCol"].apply(str)
-        actual = read_excel(xlsx_path, 'Sheet1', converters={"StrCol": str})
-        tm.assert_frame_equal(actual, expected)
+        for s in suffix:
+            path = os.path.join(self.dirpath, 'test_types.%s' %s)
+            expected["StrCol"] = expected["StrCol"].apply(str)
+            actual = read_excel(path, 'Sheet1', converters={"StrCol": str})
+            tm.assert_frame_equal(actual, expected)
 
-        no_convert_float = float_expected.copy()
-        no_convert_float["StrCol"] = no_convert_float["StrCol"].apply(str)
-        actual = read_excel(xlsx_path, 'Sheet1', converters={"StrCol": str},
-                           convert_float=False)
-        tm.assert_frame_equal(actual, no_convert_float)
+        for s in suffix:
+            path = os.path.join(self.dirpath, 'test_types.%s' %s)
+            no_convert_float = float_expected.copy()
+            no_convert_float["StrCol"] = no_convert_float["StrCol"].apply(str)
+            actual = read_excel(path, 'Sheet1', converters={"StrCol": str},
+                               convert_float=False)
+            tm.assert_frame_equal(actual, no_convert_float)
 
     # GH8212 - support for converters and missing values
     def test_reader_converters(self):
-        _skip_if_no_xlrd()
-        _skip_if_no_openpyxl()
-        _skip_if_no_ezodf()
+
+        suffix = set(['xls', 'xlsx', 'ods']) & self.suffix2test
+        if len(suffix) < 1:
+            raise nose.SkipTest('no spreadsheet readers installed, skipping')
 
         expected = DataFrame.from_items([
             ("IntCol", [1, 2, -3, -1000, 0]),
@@ -453,12 +473,9 @@ def test_reader_converters(self):
                       3: lambda x: str(x) if x else '',
                       }
 
-        xlsx_path = os.path.join(self.dirpath, 'test_converters.xlsx')
-        xls_path = os.path.join(self.dirpath, 'test_converters.xls')
-        ods_path = os.path.join(self.dirpath, 'test_converters.ods')
-
         # should read in correctly and set types of single cells (not array dtypes)
-        for path in (xls_path, xlsx_path, ods_path):
+        for s in suffix:
+            path = os.path.join(self.dirpath, 'test_converters.%s' % s)
             actual = read_excel(path, 'Sheet1', converters=converters)
             tm.assert_frame_equal(actual, expected)