@@ -239,42 +239,6 @@ def time_merge_dataframe_integer_key(self):
239
239
merge (self .df , self .df2 , on = 'key1' )
240
240
241
241
242
- class merge_asof_int32_noby (object ):
243
-
244
- def setup (self ):
245
- np .random .seed (0 )
246
- one_count = 200000
247
- two_count = 1000000
248
- self .df1 = pd .DataFrame ({'time' : np .random .randint (0 , one_count / 20 , one_count ),
249
- 'value1' : np .random .randn (one_count )})
250
- self .df1 .time = np .int32 (self .df1 .time )
251
- self .df2 = pd .DataFrame ({'time' : np .random .randint (0 , two_count / 20 , two_count ),
252
- 'value2' : np .random .randn (two_count )})
253
- self .df2 .time = np .int32 (self .df2 .time )
254
- self .df1 = self .df1 .sort_values ('time' )
255
- self .df2 = self .df2 .sort_values ('time' )
256
-
257
- def time_merge_asof_int32_noby (self ):
258
- merge_asof (self .df1 , self .df2 , on = 'time' )
259
-
260
-
261
- class merge_asof_by_object (object ):
262
-
263
- def setup (self ):
264
- import string
265
- np .random .seed (0 )
266
- one_count = 200000
267
- two_count = 1000000
268
- self .df1 = pd .DataFrame ({'time' : np .random .randint (0 , one_count / 20 , one_count ),
269
- 'key' : np .random .choice (list (string .ascii_uppercase ), one_count ),
270
- 'value1' : np .random .randn (one_count )})
271
- self .df2 = pd .DataFrame ({'time' : np .random .randint (0 , two_count / 20 , two_count ),
272
- 'key' : np .random .choice (list (string .ascii_uppercase ), two_count ),
273
- 'value2' : np .random .randn (two_count )})
274
- self .df1 = self .df1 .sort_values ('time' )
275
- self .df2 = self .df2 .sort_values ('time' )
276
-
277
-
278
242
class i8merge (object ):
279
243
goal_time = 0.2
280
244
@@ -306,35 +270,8 @@ def setup(self):
306
270
'key' : np .tile (np .arange (0 , 10000 , 2 ), 10 ),
307
271
'lvalue' : np .random .randn (50000 )})
308
272
309
- < << << << HEAD
310
- class merge_asof_multiby (object ):
311
-
312
- def setup (self ):
313
- import string
314
- np .random .seed (0 )
315
- one_count = 200000
316
- two_count = 1000000
317
- self .df1 = pd .DataFrame ({'time' : np .random .randint (0 , one_count / 20 , one_count ),
318
- 'key1' : np .random .choice (list (string .ascii_uppercase ), one_count ),
319
- 'key2' : np .random .choice (list (string .ascii_uppercase ), one_count ),
320
- 'value1' : np .random .randn (one_count )})
321
- self .df2 = pd .DataFrame ({'time' : np .random .randint (0 , two_count / 20 , two_count ),
322
- 'key1' : np .random .choice (list (string .ascii_uppercase ), two_count ),
323
- 'key2' : np .random .choice (list (string .ascii_uppercase ), two_count ),
324
- 'value2' : np .random .randn (two_count )})
325
- self .df1 = self .df1 .sort_values ('time' )
326
- self .df2 = self .df2 .sort_values ('time' )
327
-
328
- def time_merge_asof_multiby (self ):
329
- merge_asof (self .df1 , self .df2 , on = 'time' , by = ['key1' , 'key2' ])
330
-
331
-
332
- class join_non_unique_equal (object ):
333
- goal_time = 0.2
334
- == == == =
335
273
self .right = pd .DataFrame ({'key' : np .arange (10000 ),
336
274
'rvalue' : np .random .randn (10000 )})
337
- >> >> >> > master
338
275
339
276
def time_merge_ordered (self ):
340
277
merge_ordered (self .left , self .right , on = 'key' , left_by = 'group' )
@@ -365,12 +302,19 @@ def setup(self):
365
302
self .df1 = self .df1 .sort_values ('time' )
366
303
self .df2 = self .df2 .sort_values ('time' )
367
304
305
+ self .df1 ['time32' ] = np .int32 (self .df1 .time )
306
+ self .df2 ['time32' ] = np .int32 (self .df2 .time )
307
+
368
308
self .df1a = self .df1 [['time' , 'value1' ]]
369
309
self .df2a = self .df2 [['time' , 'value2' ]]
370
310
self .df1b = self .df1 [['time' , 'key' , 'value1' ]]
371
311
self .df2b = self .df2 [['time' , 'key' , 'value2' ]]
372
312
self .df1c = self .df1 [['time' , 'key2' , 'value1' ]]
373
313
self .df2c = self .df2 [['time' , 'key2' , 'value2' ]]
314
+ self .df1d = self .df1 [['time32' , 'value1' ]]
315
+ self .df2d = self .df2 [['time32' , 'value2' ]]
316
+ self .df1e = self .df1 [['time' , 'key' , 'key2' , 'value1' ]]
317
+ self .df2e = self .df2 [['time' , 'key' , 'key2' , 'value2' ]]
374
318
375
319
def time_noby (self ):
376
320
merge_asof (self .df1a , self .df2a , on = 'time' )
@@ -381,6 +325,12 @@ def time_by_object(self):
381
325
def time_by_int (self ):
382
326
merge_asof (self .df1c , self .df2c , on = 'time' , by = 'key2' )
383
327
328
+ def time_on_int32 (self ):
329
+ merge_asof (self .df1d , self .df2d , on = 'time32' )
330
+
331
+ def time_multiby (self ):
332
+ merge_asof (self .df1e , self .df2e , on = 'time' , by = ['key' , 'key2' ])
333
+
384
334
385
335
#----------------------------------------------------------------------
386
336
# data alignment
0 commit comments