@@ -228,8 +228,8 @@ class DataFrame(NDFrame):
    _het_axis = 1

    _AXIS_NUMBERS = {
-        'index' : 0,
-        'columns' : 1
+        'index': 0,
+        'columns': 1
    }

    _AXIS_NAMES = dict((v, k) for k, v in _AXIS_NUMBERS.iteritems())
@@ -246,8 +246,8 @@ def __init__(self, data=None, index=None, columns=None, dtype=None,
    data : numpy ndarray (structured or homogeneous), dict, or DataFrame
        Dict can contain Series, arrays, constants, or list-like objects
    index : Index or array-like
-        Index to use for resulting frame. Will default to np.arange(n) if no
-        indexing information part of input data and no index provided
+        Index to use for resulting frame. Will default to np.arange(n) if
+        no indexing information part of input data and no index provided
    columns : Index or array-like
        Will default to np.arange(n) if not column labels provided
    dtype : dtype, default None
@@ -257,7 +257,7 @@ def __init__(self, data=None, index=None, columns=None, dtype=None,

    Examples
    --------
-    >>> d = {'col1' : ts1, 'col2' : ts2}
+    >>> d = {'col1': ts1, 'col2': ts2}
    >>> df = DataFrame(data=d, index=index)
    >>> df2 = DataFrame(np.random.randn(10, 5))
    >>> df3 = DataFrame(np.random.randn(10, 5),
@@ -535,7 +535,8 @@ def __contains__(self, key):
    # Python 2 division methods
    if not py3compat.PY3:
        __div__ = _arith_method(operator.div, '__div__', default_axis=None)
-        __rdiv__ = _arith_method(lambda x, y: y / x, '__rdiv__', default_axis=None)
+        __rdiv__ = _arith_method(lambda x, y: y / x, '__rdiv__',
+                                 default_axis=None)

    def __neg__(self):
        arr = operator.neg(self.values)
@@ -855,7 +856,7 @@ def _helper_csvexcel(self, writer, na_rep=None, cols=None, header=True,
                index_label = []
                for i, name in enumerate(self.index.names):
                    if name is None:
-                        name = ''    # 'level_%d' % i
+                        name = ''
                    index_label.append(name)
            else:
                index_label = self.index.name
@@ -892,7 +893,7 @@ def _helper_csvexcel(self, writer, na_rep=None, cols=None, header=True,
            if index:
                if nlevels == 1:
                    row_fields = [idx]
-                else: # handle MultiIndex
+                else:  # handle MultiIndex
                    row_fields = list(idx)
            for i, col in enumerate(cols):
                val = series[col].get(idx)
@@ -960,8 +961,8 @@ def to_csv(self, path_or_buf, sep=",", na_rep='', cols=None,
        if close:
            f.close()

-    def to_excel(self, excel_writer, sheet_name = 'sheet1', na_rep='', cols=None, header=True,
-                 index=True, index_label=None):
+    def to_excel(self, excel_writer, sheet_name='sheet1', na_rep='',
+                 cols=None, header=True, index=True, index_label=None):
        """
        Write DataFrame to a excel sheet

@@ -987,8 +988,8 @@ def to_excel(self, excel_writer, sheet_name = 'sheet1', na_rep='', cols=None, he
        Notes
        -----
        If passing an existing ExcelWriter object, then the sheet will be added
-        to the existing workbook. This can be used to save different DataFrames
-        to one workbook
+        to the existing workbook. This can be used to save different
+        DataFrames to one workbook
        >>> writer = ExcelWriter('output.xlsx')
        >>> df1.to_excel(writer,'sheet1')
        >>> df2.to_excel(writer,'sheet2')
@@ -1000,8 +1001,9 @@ def to_excel(self, excel_writer, sheet_name = 'sheet1', na_rep='', cols=None, he
            excel_writer = ExcelWriter(excel_writer)
            need_save = True
        excel_writer.cur_sheet = sheet_name
-        self._helper_csvexcel(excel_writer, na_rep=na_rep, cols=cols, header=header,
-                              index=index, index_label=index_label, encoding=None)
+        self._helper_csvexcel(excel_writer, na_rep=na_rep, cols=cols,
+                              header=header, index=index,
+                              index_label=index_label, encoding=None)
        if need_save:
            excel_writer.save()

@@ -1657,8 +1659,8 @@ def lookup(self, row_labels, col_labels):

    def align(self, other, join='outer', axis=None, level=None, copy=True):
        """
-        Align two DataFrame object on their index and columns with the specified
-        join method for each axis Index
+        Align two DataFrame object on their index and columns with the
+        specified join method for each axis Index

        Parameters
        ----------
@@ -2084,7 +2086,7 @@ def dropna(self, axis=0, how='any', thresh=None, subset=None):
        agg_obj = self
        if subset is not None:
            agg_axis_name = self._get_axis_name(agg_axis)
-            agg_obj = self.reindex(**{agg_axis_name : subset})
+            agg_obj = self.reindex(**{agg_axis_name: subset})

        count = agg_obj.count(axis=agg_axis)

@@ -2102,7 +2104,7 @@ def dropna(self, axis=0, how='any', thresh=None, subset=None):

        labels = self._get_axis(axis)
        new_labels = labels[mask]
-        return self.reindex(**{axis_name : new_labels})
+        return self.reindex(**{axis_name: new_labels})

    def drop_duplicates(self, cols=None, take_last=False):
        """
@@ -2280,7 +2282,8 @@ def reorder_levels(self, order, axis=0):
        -------
        type of caller (new object)
        """
-        if not isinstance(self._get_axis(axis), MultiIndex):  # pragma: no cover
+        if not isinstance(self._get_axis(axis),
+                          MultiIndex):  # pragma: no cover
            raise Exception('Can only reorder levels on a hierarchical axis.')

        result = self.copy()
@@ -2751,7 +2754,8 @@ def asfreq(self, freq, method=None):
        if isinstance(freq, datetools.DateOffset):
            dateRange = DateRange(self.index[0], self.index[-1], offset=freq)
        else:
-            dateRange = DateRange(self.index[0], self.index[-1], time_rule=freq)
+            dateRange = DateRange(self.index[0], self.index[-1],
+                                  time_rule=freq)

        return self.reindex(dateRange, method=method)

@@ -2864,8 +2868,8 @@ def apply(self, func, axis=0, broadcast=False, raw=False,

        Notes
        -----
-        Function passed should not have side effects. If the result is a Series,
-        it should have the same index
+        Function passed should not have side effects. If the result is a
+        Series, it should have the same index

        Returns
        -------
@@ -3038,7 +3042,8 @@ def append(self, other, ignore_index=False, verify_integrity=True):
        if isinstance(other, dict):
            other = Series(other)
        if other.name is None and not ignore_index:
-            raise Exception('Can only append a Series if ignore_index=True')
+            raise Exception('Can only append a Series if '
+                            'ignore_index=True')

        index = None if other.name is None else [other.name]
        other = other.reindex(self.columns, copy=False)
@@ -3114,7 +3119,7 @@ def _join_compat(self, other, on=None, how='left', lsuffix='', rsuffix='',

        if isinstance(other, Series):
            assert(other.name is not None)
-            other = DataFrame({other.name : other})
+            other = DataFrame({other.name: other})

        if isinstance(other, DataFrame):
            return merge(self, other, left_on=on, how=how,
@@ -3343,7 +3348,8 @@ def _count_level(self, level, axis=0, numeric_only=False):
        if axis == 1:
            frame = frame.T

-        mask = notnull(frame.values).view(np.uint8)  # python 2.5
+        # python 2.5
+        mask = notnull(frame.values).view(np.uint8)

        level_index = frame.index.levels[level]
        counts = lib.count_level_2d(mask, frame.index.labels[level],
@@ -3687,8 +3693,8 @@ def boxplot(self, column=None, by=None, ax=None, fontsize=None,
        """
        import pandas.tools.plotting as plots
        import matplotlib.pyplot as plt
-        ax = plots.boxplot(self, column=column, by=by, ax=ax, fontsize=fontsize,
-                           grid=grid, rot=rot, **kwds)
+        ax = plots.boxplot(self, column=column, by=by, ax=ax,
+                           fontsize=fontsize, grid=grid, rot=rot, **kwds)
        plt.draw_if_interactive()
        return ax

@@ -3791,7 +3797,7 @@ def _bar_plot(self, axes, subplots=False, use_index=True, grid=True,
                                    bottom=np.zeros(N), linewidth=1, **kwds)
                ax.set_title(col)
            else:
-                rects.append(ax.bar(xinds + i * 0.5/K, y, 0.5/K,
+                rects.append(ax.bar(xinds + i * 0.5 / K, y, 0.5 / K,
                                    bottom=np.zeros(N), label=col,
                                    color=colors[i % len(colors)], **kwds))
            labels.append(col)
@@ -3907,7 +3913,7 @@ def group_agg(values, bounds, f):
        else:
            right_bound = bounds[i + 1]

-        result[i] = f(values[left_bound : right_bound])
+        result[i] = f(values[left_bound:right_bound])

    return result

@@ -4027,6 +4033,7 @@ def _rec_to_dict(arr):

    return columns, sdict

+

def _list_to_sdict(data, columns):
    if len(data) > 0 and isinstance(data[0], tuple):
        content = list(lib.to_object_array_tuples(data).T)
@@ -4039,6 +4046,7 @@ def _list_to_sdict(data, columns):
        return {}, columns
    return _convert_object_array(content, columns)

+

def _list_of_dict_to_sdict(data, columns):
    if columns is None:
        gen = (x.keys() for x in data)
@@ -4047,6 +4055,7 @@ def _list_of_dict_to_sdict(data, columns):
    content = list(lib.dicts_to_array(data, list(columns)).T)
    return _convert_object_array(content, columns)

+

def _convert_object_array(content, columns):
    if columns is None:
        columns = range(len(content))
@@ -4059,6 +4068,7 @@ def _convert_object_array(content, columns):
                 for c, vals in zip(columns, content))
    return sdict, columns

+

def _homogenize(data, index, columns, dtype=None):
    from pandas.core.series import _sanitize_array

@@ -4104,9 +4114,11 @@ def _homogenize(data, index, columns, dtype=None):

    return homogenized

+

def _put_str(s, space):
    return ('%s' % s)[:space].ljust(space)

+

def _is_sequence(x):
    try:
        iter(x)
@@ -4115,6 +4127,7 @@ def _is_sequence(x):
    except Exception:
        return False

+

def install_ipython_completers():  # pragma: no cover
    """Register the DataFrame type with IPython's tab completion machinery, so
    that it knows about accessing column names as attributes."""
@@ -4125,6 +4138,7 @@ def complete_dataframe(obj, prev_completions):
        return prev_completions + [c for c in obj.columns \
                if isinstance(c, basestring) and py3compat.isidentifier(c)]

+

# Importing IPython brings in about 200 modules, so we want to avoid it unless
# we're in IPython (when those modules are loaded anyway).
if "IPython" in sys.modules:  # pragma: no cover
@@ -4133,6 +4147,7 @@ def complete_dataframe(obj, prev_completions):
    except Exception:
        pass

+

def _indexer_from_factorized(labels, shape, compress=True):
    from pandas.core.groupby import get_group_index, _compress_group_index

@@ -4149,6 +4164,7 @@ def _indexer_from_factorized(labels, shape, compress=True):

    return indexer

+

def _lexsort_indexer(keys):
    labels = []
    shape = []
@@ -4163,6 +4179,7 @@ def _lexsort_indexer(keys):
        shape.append(len(rizer.uniques))
    return _indexer_from_factorized(labels, shape)

+

if __name__ == '__main__':
    import nose
    nose.runmodule(argv=[__file__, '-vvs', '-x', '--pdb', '--pdb-failure'],