1
1
# coding: utf-8
2
2
import pandas as pd
3
+ from textwrap import dedent
3
4
4
5
import dask .dataframe as dd
5
6
from dask .dataframe .utils import PANDAS_VERSION
@@ -440,14 +441,26 @@ def test_index_format():
440
441
s = pd .Series ([1 , 2 , 3 , 4 , 5 , 6 , 7 , 8 ],
441
442
index = pd .CategoricalIndex ([1 , 2 , 3 , 4 , 5 , 6 , 7 , 8 ], name = 'YYY' ))
442
443
ds = dd .from_pandas (s , 3 )
443
- exp = """Dask Index Structure:
444
- npartitions=3
445
- 1 category[known]
446
- 4 ...
447
- 7 ...
448
- 8 ...
449
- Name: YYY, dtype: category
450
- Dask Name: from_pandas, 6 tasks"""
444
+ if PANDAS_VERSION >= '0.21.0' :
445
+ exp = dedent ("""\
446
+ Dask Index Structure:
447
+ npartitions=3
448
+ 1 category[known]
449
+ 4 ...
450
+ 7 ...
451
+ 8 ...
452
+ Name: YYY, dtype: CategoricalDtype(categories=[1, 2, 3, 4, 5, 6, 7, 8], ordered=False)
453
+ Dask Name: from_pandas, 6 tasks""" )
454
+ else :
455
+ exp = dedent ("""\
456
+ Dask Index Structure:
457
+ npartitions=3
458
+ 1 category[known]
459
+ 4 ...
460
+ 7 ...
461
+ 8 ...
462
+ Name: YYY, dtype: category
463
+ Dask Name: from_pandas, 6 tasks""" )
451
464
assert repr (ds .index ) == exp
452
465
assert str (ds .index ) == exp
453
466
@@ -456,17 +469,36 @@ def test_categorical_format():
456
469
s = pd .Series (['a' , 'b' , 'c' ]).astype ('category' )
457
470
known = dd .from_pandas (s , npartitions = 1 )
458
471
unknown = known .cat .as_unknown ()
459
- exp = ("Dask Series Structure:\n "
460
- "npartitions=1\n "
461
- "0 category[known]\n "
462
- "2 ...\n "
463
- "dtype: category\n "
464
- "Dask Name: from_pandas, 1 tasks" )
472
+ if PANDAS_VERSION >= '0.21.0' :
473
+ exp = dedent ("""\
474
+ Dask Series Structure:
475
+ npartitions=1
476
+ 0 category[known]
477
+ 2 ...
478
+ dtype: CategoricalDtype(categories=['a', 'b', 'c'], ordered=False)
479
+ Dask Name: from_pandas, 1 tasks""" )
480
+ else :
481
+ exp = ("Dask Series Structure:\n "
482
+ "npartitions=1\n "
483
+ "0 category[known]\n "
484
+ "2 ...\n "
485
+ "dtype: category\n "
486
+ "Dask Name: from_pandas, 1 tasks" )
465
487
assert repr (known ) == exp
466
- exp = ("Dask Series Structure:\n "
467
- "npartitions=1\n "
468
- "0 category[unknown]\n "
469
- "2 ...\n "
470
- "dtype: category\n "
471
- "Dask Name: from_pandas, 1 tasks" )
488
+ if PANDAS_VERSION >= '0.21.0' :
489
+ exp = dedent ("""\
490
+ Dask Series Structure:
491
+ npartitions=1
492
+ 0 category[unknown]
493
+ 2 ...
494
+ dtype: CategoricalDtype(categories=['__UNKNOWN_CATEGORIES__'], ordered=False)
495
+ Dask Name: from_pandas, 1 tasks""" )
496
+
497
+ else :
498
+ exp = ("Dask Series Structure:\n "
499
+ "npartitions=1\n "
500
+ "0 category[unknown]\n "
501
+ "2 ...\n "
502
+ "dtype: category\n "
503
+ "Dask Name: from_pandas, 1 tasks" )
472
504
assert repr (unknown ) == exp
0 commit comments