Skip to content

Commit fafbb02

Browse files
author
Christopher C. Aycock
committed
Updated benchmarks to reflect new ASV setup
1 parent 5eeb7d9 commit fafbb02

File tree

1 file changed

+13
-63
lines changed

1 file changed

+13
-63
lines changed

asv_bench/benchmarks/join_merge.py

+13-63
Original file line numberDiff line numberDiff line change
@@ -239,42 +239,6 @@ def time_merge_dataframe_integer_key(self):
239239
merge(self.df, self.df2, on='key1')
240240

241241

242-
class merge_asof_int32_noby(object):
243-
244-
def setup(self):
245-
np.random.seed(0)
246-
one_count = 200000
247-
two_count = 1000000
248-
self.df1 = pd.DataFrame({'time': np.random.randint(0, one_count/20, one_count),
249-
'value1': np.random.randn(one_count)})
250-
self.df1.time = np.int32(self.df1.time)
251-
self.df2 = pd.DataFrame({'time': np.random.randint(0, two_count/20, two_count),
252-
'value2': np.random.randn(two_count)})
253-
self.df2.time = np.int32(self.df2.time)
254-
self.df1 = self.df1.sort_values('time')
255-
self.df2 = self.df2.sort_values('time')
256-
257-
def time_merge_asof_int32_noby(self):
258-
merge_asof(self.df1, self.df2, on='time')
259-
260-
261-
class merge_asof_by_object(object):
262-
263-
def setup(self):
264-
import string
265-
np.random.seed(0)
266-
one_count = 200000
267-
two_count = 1000000
268-
self.df1 = pd.DataFrame({'time': np.random.randint(0, one_count/20, one_count),
269-
'key': np.random.choice(list(string.ascii_uppercase), one_count),
270-
'value1': np.random.randn(one_count)})
271-
self.df2 = pd.DataFrame({'time': np.random.randint(0, two_count/20, two_count),
272-
'key': np.random.choice(list(string.ascii_uppercase), two_count),
273-
'value2': np.random.randn(two_count)})
274-
self.df1 = self.df1.sort_values('time')
275-
self.df2 = self.df2.sort_values('time')
276-
277-
278242
class i8merge(object):
279243
goal_time = 0.2
280244

@@ -306,35 +270,8 @@ def setup(self):
306270
'key' : np.tile(np.arange(0, 10000, 2), 10),
307271
'lvalue': np.random.randn(50000)})
308272

309-
<<<<<<< HEAD
310-
class merge_asof_multiby(object):
311-
312-
def setup(self):
313-
import string
314-
np.random.seed(0)
315-
one_count = 200000
316-
two_count = 1000000
317-
self.df1 = pd.DataFrame({'time': np.random.randint(0, one_count/20, one_count),
318-
'key1': np.random.choice(list(string.ascii_uppercase), one_count),
319-
'key2': np.random.choice(list(string.ascii_uppercase), one_count),
320-
'value1': np.random.randn(one_count)})
321-
self.df2 = pd.DataFrame({'time': np.random.randint(0, two_count/20, two_count),
322-
'key1': np.random.choice(list(string.ascii_uppercase), two_count),
323-
'key2': np.random.choice(list(string.ascii_uppercase), two_count),
324-
'value2': np.random.randn(two_count)})
325-
self.df1 = self.df1.sort_values('time')
326-
self.df2 = self.df2.sort_values('time')
327-
328-
def time_merge_asof_multiby(self):
329-
merge_asof(self.df1, self.df2, on='time', by=['key1', 'key2'])
330-
331-
332-
class join_non_unique_equal(object):
333-
goal_time = 0.2
334-
=======
335273
self.right = pd.DataFrame({'key' : np.arange(10000),
336274
'rvalue' : np.random.randn(10000)})
337-
>>>>>>> master
338275

339276
def time_merge_ordered(self):
340277
merge_ordered(self.left, self.right, on='key', left_by='group')
@@ -365,12 +302,19 @@ def setup(self):
365302
self.df1 = self.df1.sort_values('time')
366303
self.df2 = self.df2.sort_values('time')
367304

305+
self.df1['time32'] = np.int32(self.df1.time)
306+
self.df2['time32'] = np.int32(self.df2.time)
307+
368308
self.df1a = self.df1[['time', 'value1']]
369309
self.df2a = self.df2[['time', 'value2']]
370310
self.df1b = self.df1[['time', 'key', 'value1']]
371311
self.df2b = self.df2[['time', 'key', 'value2']]
372312
self.df1c = self.df1[['time', 'key2', 'value1']]
373313
self.df2c = self.df2[['time', 'key2', 'value2']]
314+
self.df1d = self.df1[['time32', 'value1']]
315+
self.df2d = self.df2[['time32', 'value2']]
316+
self.df1e = self.df1[['time', 'key', 'key2', 'value1']]
317+
self.df2e = self.df2[['time', 'key', 'key2', 'value2']]
374318

375319
def time_noby(self):
376320
merge_asof(self.df1a, self.df2a, on='time')
@@ -381,6 +325,12 @@ def time_by_object(self):
381325
def time_by_int(self):
382326
merge_asof(self.df1c, self.df2c, on='time', by='key2')
383327

328+
def time_on_int32(self):
329+
merge_asof(self.df1d, self.df2d, on='time32')
330+
331+
def time_multiby(self):
332+
merge_asof(self.df1e, self.df2e, on='time', by=['key', 'key2'])
333+
384334

385335
#----------------------------------------------------------------------
386336
# data alignment

0 commit comments

Comments
 (0)