revised according to comments

jreback · jreback · commit a80ae5ef10a6 · 2015-05-08T16:26:02.000-04:00
diff --git a/doc/source/whatsnew/v0.16.1.txt b/doc/source/whatsnew/v0.16.1.txt
@@ -253,8 +253,7 @@ API changes
 Index Representation
 ~~~~~~~~~~~~~~~~~~~~
 
-The string representation of ``Index`` and its sub-classes have now been unified. ``Index, Int64Index, Float64Index, CategoricalIndex`` are single-line display. The datetimelikes ``DatetimeIndex, PeriodIndex, TimedeltaIndex`` & ``MultiIndex`` will display in a multi-line format showing much more of the index values. The display width responds to the option ``display.max_seq_items``,
-which is defaulted to 100. (:issue:`6482`)
+The string representation of ``Index`` and its sub-classes has now been unified. These will show a single-line display if there are few values; a wrapped multi-line display for a lot of values (but less than ``display.max_seq_items``); and, if there are lots of items (> ``display.max_seq_items``), a truncated display (the head and tail of the data). The formatting for ``MultiIndex`` is unchanged (a multi-line wrapped display). The display width responds to the option ``display.max_seq_items``, which defaults to 100. (:issue:`6482`)
 
 Previous Behavior
 
@@ -289,6 +288,11 @@ New Behavior
    pd.Index(range(4),name='foo')
    pd.Index(range(25),name='foo')
    pd.Index(range(104),name='foo')
+   pd.CategoricalIndex(['a','bb','ccc','dddd'],ordered=True,name='foobar')
+   pd.CategoricalIndex(['a','bb','ccc','dddd']*10,ordered=True,name='foobar')
+   pd.CategoricalIndex(['a','bb','ccc','dddd']*100,ordered=True,name='foobar')
+   pd.CategoricalIndex(np.arange(1000),ordered=True,name='foobar')
+   pd.Index(['a','bb','ccc','dddd']*100)
    pd.date_range('20130101',periods=4,name='foo',tz='US/Eastern')
    pd.date_range('20130101',periods=25,name='foo',tz='US/Eastern')
    pd.date_range('20130101',periods=104,name='foo',tz='US/Eastern')
diff --git a/pandas/core/index.py b/pandas/core/index.py
@@ -440,6 +440,7 @@ def _format_data(self):
         sep = ','
         max_seq_items = get_option('display.max_seq_items')
         formatter = self._formatter_func
+        needs_justify = self.inferred_type in ['string','categorical']
 
         def best_len(values):
             return max([len(x) for x in values]) + 2
@@ -453,23 +454,27 @@ def best_rows(values, max_len):
             n_rows = int(ceil(len(values) / float(n_per_row)))
             return n_per_row, n_rows
 
-        def best_fit(values, max_len, justify=False):
+        def best_fit(values, max_len, n_rows=None, justify=False):
 
             # number of rows to generate
-            n_per_row, n_rows = best_rows(values, max_len)
+            if n_rows is None:
+                n_per_row, n_rows = best_rows(values, max_len)
+            else:
+                n_per_row = len(values)
 
             # adjust all values to max length if we have multi-lines
-            if n_rows > 1 or justify:
+            if justify:
                 values = [values[0].rjust(max_len-2)] + [x.rjust(max_len-1) for x in values[1:]]
-                sep_elements = sep
+                multi_line_space = space1
             else:
-                sep_elements = sep + ' '
+                multi_line_space = space2
 
+            sep_elements = sep + ' '
             summary = ''
             for i in range(n_rows - 1):
-                summary += sep.join(values[i*n_per_row:(i+1)*n_per_row])
+                summary += sep_elements.join(values[i*n_per_row:(i+1)*n_per_row])
                 summary += sep
-                summary += space1
+                summary += multi_line_space
             summary += sep_elements.join(values[(n_rows - 1)*n_per_row:n_rows*n_per_row])
 
             return summary
@@ -491,10 +496,17 @@ def best_fit(values, max_len, justify=False):
             tail = [ formatter(x) for x in self[-n:] ]
             max_len = max(best_len(head),best_len(tail))
 
+            if needs_justify:
+                n_rows = 1
+                justify = False
+            else:
+                n_rows = None
+                justify = True
+
             summary = '['
-            summary += best_fit(head, max_len, justify=True)
+            summary += best_fit(head, max_len, n_rows=n_rows, justify=justify)
             summary += ',' + space1 + ' ...' + space2
-            summary += best_fit(tail, max_len, justify=True)
+            summary += best_fit(tail, max_len, n_rows=n_rows, justify=justify)
             summary += '],'
             summary += space1
 
@@ -2936,7 +2948,9 @@ def _format_attrs(self):
         """
         Return a list of tuples of the (attr,formatted_value)
         """
-        attrs = [('categories', default_pprint(self.categories)),
+        max_categories = (10 if get_option("display.max_categories") == 0
+                    else get_option("display.max_categories"))
+        attrs = [('categories', default_pprint(self.categories, max_seq_items=max_categories)),
                  ('ordered',self.ordered)]
         if self.name is not None:
             attrs.append(('name',default_pprint(self.name)))
diff --git a/pandas/tests/test_index.py b/pandas/tests/test_index.py
@@ -2463,7 +2463,7 @@ def test_print_unicode_columns(self):
     def test_repr_summary(self):
         with cf.option_context('display.max_seq_items', 10):
             r = repr(pd.Index(np.arange(1000)))
-            self.assertTrue(len(r) < 150)
+            self.assertTrue(len(r) < 200)
             self.assertTrue("..." in r)
 
     def test_repr_roundtrip(self):