pandas-dev · lgautier · Jul 21, 2013 · Jul 21, 2013 · Jul 22, 2013 · Jul 22, 2013
diff --git a/pandas/core/frame.py b/pandas/core/frame.py
@@ -5680,6 +5680,9 @@ def _arrays_to_mgr(arrays, arr_names, index, columns, dtype=None):
     return create_block_manager_from_arrays(arrays, arr_names, axes)
 
 def extract_index(data):
+    # Slightly misleading name: an index is only derived from the
+    # elements of the iterable `data` that are Series (their index)
+    # or dicts (their keys); sequences only contribute their length.
     from pandas.core.index import _union_indexes
 
     index = None
@@ -5693,19 +5696,31 @@ def extract_index(data):
         have_series = False
         have_dicts = False
 
+        # Loop over the elements `v` of `data`, i.e. the vectors
+        # corresponding to columns in the DataFrame.
         for v in data:
             if isinstance(v, Series):
                 have_series = True
                 indexes.append(v.index)
             elif isinstance(v, dict):
                 have_dicts = True
                 indexes.append(v.keys())
-            elif isinstance(v, (list, tuple, np.ndarray)):
+            elif com._is_sequence(v):
+                # This is a sequence-but-not-a-string
+                # Although strings have a __len__,
+                # they will be considered scalar.
                 have_raw_arrays = True
                 raw_lengths.append(len(v))
+            else:
+                # Item v silently ignored (to conserve
+                # the original behaviour - see also
+                # test of __getitem__ below).
+                # This behaviour is kept, but I think
+                # that an exception (TypeError) should be raised instead.
+                pass
 
         if not indexes and not raw_lengths:
-            raise ValueError('If using all scalar values, you must must pass'
+            raise ValueError('If using all scalar values, you must pass'
                              ' an index')
 
         if have_series or have_dicts:
@@ -5714,15 +5729,15 @@ def extract_index(data):
         if have_raw_arrays:
             lengths = list(set(raw_lengths))
             if len(lengths) > 1:
-                raise ValueError('arrays must all be same length')
+                raise ValueError('Arrays must all be same length')
 
             if have_dicts:
                 raise ValueError('Mixing dicts with non-Series may lead to '
                                  'ambiguous ordering.')
 
             if have_series:
                 if lengths[0] != len(index):
-                    msg = ('array length %d does not match index length %d'
+                    msg = ('Array length %d does not match index length %d'
                            % (lengths[0], len(index)))
                     raise ValueError(msg)
             else:

diff --git a/pandas/tests/test_frame.py b/pandas/tests/test_frame.py
@@ -2236,7 +2236,7 @@ def testit():
 
         def testit():
             DataFrame({'a': False, 'b': True})
-        assertRaisesRegexp(ValueError, 'If using all scalar values, you must must pass an index', testit)
+        assertRaisesRegexp(ValueError, 'If using all scalar values, you must pass an index', testit)
 
     def test_insert_error_msmgs(self):
 
@@ -2774,6 +2774,17 @@ def test_constructor_from_items(self):
         # pass some columns
         recons = DataFrame.from_items(items, columns=['C', 'B', 'A'])
         assert_frame_equal(recons, self.frame.ix[:, ['C', 'B', 'A']])
+        # columns may be any sequence (e.g. array.array), not just list, tuple or ndarray
+        import array
+        recons_ar = DataFrame.from_items([('A', array.array('i', range(10)))])
+        recons_rg = DataFrame.from_items([('A', range(10))])
+        recons_np = DataFrame.from_items([('A', np.array(range(10)))])
+        self.assertEquals(tuple(recons_ar['A']),
+                          tuple(recons_rg['A']))
+        self.assertEquals(tuple(recons_ar['A']),
+                          tuple(recons_np['A']))
+
+
 
         # orient='index'