pandas-dev · ghost · Jan 20, 2018 · Jan 20, 2018 · Jan 20, 2018 · Jan 20, 2018
diff --git a/doc/source/whatsnew/v0.23.0.txt b/doc/source/whatsnew/v0.23.0.txt
@@ -509,6 +509,7 @@ Reshaping
 - Bug in :func:`DataFrame.merge` in which merging using ``Index`` objects as vectors raised an Exception (:issue:`19038`)
 - Bug in :func:`DataFrame.stack`, :func:`DataFrame.unstack`, :func:`Series.unstack` which were not returning subclasses (:issue:`15563`)
 - Bug in timezone comparisons, manifesting as a conversion of the index to UTC in ``.concat()`` (:issue:`18523`)
+- Bug in :func:`crosstab` in which the internally added ``__dummy__`` column was not removed correctly from the result (:issue:`18321`)
 -
 
 Numeric

diff --git a/pandas/core/reshape/pivot.py b/pandas/core/reshape/pivot.py
@@ -455,17 +455,23 @@ def crosstab(index, columns, values=None, rownames=None, colnames=None,
 
     from pandas import DataFrame
     df = DataFrame(data, index=common_idx)
+    common_cols_idx = df.columns
+
     if values is None:
         df['__dummy__'] = 0
         kwargs = {'aggfunc': len, 'fill_value': 0}
     else:
         df['__dummy__'] = values
         kwargs = {'aggfunc': aggfunc}
 
-    table = df.pivot_table('__dummy__', index=rownames, columns=colnames,
+    table = df.pivot_table(['__dummy__'], index=rownames, columns=colnames,
                            margins=margins, margins_name=margins_name,
                            dropna=dropna, **kwargs)
 
+    if not table.empty:
+        added_cols_idx = list(df.columns.difference(common_cols_idx))[0]
+        table = table[added_cols_idx]
+
     # Post-process
     if normalize is not False:
         table = _normalize(table, normalize=normalize, margins=margins,

diff --git a/pandas/tests/reshape/test_pivot.py b/pandas/tests/reshape/test_pivot.py
@@ -1628,7 +1628,8 @@ def test_crosstab_dup_index_names(self):
         pytest.raises(ValueError, pd.crosstab, s, s)
 
     @pytest.mark.parametrize("names", [['a', ('b', 'c')],
-                                       [('a', 'b'), 'c']])
+                                       [('a', 'b'), 'c'],
+                                       [('a', 'b'), ('c', 'd')]])
     def test_crosstab_tuple_name(self, names):
         s1 = pd.Series(range(3), name=names[0])
         s2 = pd.Series(range(1, 4), name=names[1])
@@ -1638,3 +1639,31 @@ def test_crosstab_tuple_name(self, names):
 
         result = pd.crosstab(s1, s2)
         tm.assert_frame_equal(result, expected)
+
+    @pytest.mark.parametrize("names", [['a', 'b'],  # plain string names
+                                       [('a', 'b'), 'c'],  # tuple and string
+                                       [('a', 'b'), ('c', 'd')],  # both tuples
+                                       [(1, 2, 3), ('a', 'b', 'c')]])
+    def test_crosstab_cols_output(self, names):  # GH 18321
+        rows = [[1, 2, 3, 4], [1, 1, 2, 2], [1, 3, 1, 4]]  # index data per case
+        cols = [[1, 1, 1, 1], [3, 2, 2, 3], []]  # column data; last is empty
+
+        expected_ct1 = pd.DataFrame(
+            [1, 1, 1, 1],
+            index=pd.Index([1, 2, 3, 4], name=names[0]),
+            columns=pd.Index([1], name=names[1])
+        )
+        expected_ct2 = pd.DataFrame(
+            [[1, 1], [1, 1]],
+            index=pd.Index([1, 2], name=names[0]),
+            columns=pd.Index([2, 3], name=names[1])
+        )
+        expected_ct3 = pd.DataFrame([])  # for the empty column case
+        expected_arr = [expected_ct1, expected_ct2, expected_ct3]
+
+        for row, col, expected_data in zip(rows, cols, expected_arr):
+            s1 = pd.Series(row, name=names[0])
+            s2 = pd.Series(col, name=names[1])
+            result = pd.crosstab(s1, s2)
+            tm.assert_frame_equal(result, expected_data,
+                                  check_column_type=True)