@@ -90,7 +90,7 @@ cdef class ObjectFactorizer(Factorizer):
90
90
self .uniques = ObjectVector()
91
91
92
92
def factorize (
93
- self , ndarray[object] values , sort = False , na_sentinel = - 1 , na_value = None
93
+ self , ndarray[object] values , na_sentinel = - 1 , na_value = None
94
94
) -> np.ndarray:
95
95
"""
96
96
@@ -115,14 +115,6 @@ cdef class ObjectFactorizer(Factorizer):
115
115
self.uniques = uniques
116
116
labels = self .table.get_labels(values, self .uniques,
117
117
self .count, na_sentinel, na_value)
118
- mask = (labels == na_sentinel)
119
- # sort on
120
- if sort:
121
- sorter = self .uniques.to_array().argsort()
122
- reverse_indexer = np.empty(len (sorter), dtype = np.intp)
123
- reverse_indexer.put(sorter , np.arange(len(sorter )))
124
- labels = reverse_indexer.take(labels, mode = ' clip' )
125
- labels[mask] = na_sentinel
126
118
self.count = len (self .uniques)
127
119
return labels
128
120
@@ -136,7 +128,7 @@ cdef class Int64Factorizer(Factorizer):
136
128
self .table = Int64HashTable(size_hint)
137
129
self .uniques = Int64Vector()
138
130
139
- def factorize (self , const int64_t[:] values , sort = False ,
131
+ def factorize (self , const int64_t[:] values ,
140
132
na_sentinel = - 1 , na_value = None ) -> np.ndarray:
141
133
"""
142
134
Returns
@@ -161,14 +153,5 @@ cdef class Int64Factorizer(Factorizer):
161
153
labels = self .table.get_labels(values, self .uniques,
162
154
self .count, na_sentinel,
163
155
na_value = na_value)
164
-
165
- # sort on
166
- if sort:
167
- sorter = self .uniques.to_array().argsort()
168
- reverse_indexer = np.empty(len (sorter), dtype = np.intp)
169
- reverse_indexer.put(sorter , np.arange(len(sorter )))
170
-
171
- labels = reverse_indexer.take(labels)
172
-
173
156
self.count = len (self .uniques)
174
157
return labels
0 commit comments