@@ -312,11 +312,15 @@ def test_join_on(setup):
312
312
expected4 .set_index ("a2" , inplace = True )
313
313
result4 .set_index ("a2" , inplace = True )
314
314
pd .testing .assert_frame_equal (
315
- sort_dataframe_inplace (expected4 , 0 ), sort_dataframe_inplace (result4 , 0 )
315
+ sort_dataframe_inplace (expected4 , 0 , kind = "mergesort" ),
316
+ sort_dataframe_inplace (result4 , 0 , kind = "mergesort" ),
316
317
)
317
318
318
319
319
320
def test_merge_one_chunk (setup ):
321
+ def sort_by_col1 (df ):
322
+ return df .sort_values (by = df .columns [1 ], kind = "mergesort" )
323
+
320
324
df1 = pd .DataFrame (
321
325
{"lkey" : ["foo" , "bar" , "baz" , "foo" ], "value" : [1 , 2 , 3 , 5 ]},
322
326
index = ["a1" , "a2" , "a3" , "a4" ],
@@ -348,8 +352,8 @@ def test_merge_one_chunk(setup):
348
352
result = jdf .execute ().fetch ()
349
353
350
354
pd .testing .assert_frame_equal (
351
- expected . sort_values ( by = expected . columns [ 1 ] ).reset_index (drop = True ),
352
- result . sort_values ( by = result . columns [ 1 ] ).reset_index (drop = True ),
355
+ sort_by_col1 ( expected ).reset_index (drop = True ),
356
+ sort_by_col1 ( result ).reset_index (drop = True ),
353
357
)
354
358
355
359
# right have one chunk
@@ -361,8 +365,8 @@ def test_merge_one_chunk(setup):
361
365
result = jdf .execute ().fetch ()
362
366
363
367
pd .testing .assert_frame_equal (
364
- expected . sort_values ( by = expected . columns [ 1 ] ).reset_index (drop = True ),
365
- result . sort_values ( by = result . columns [ 1 ] ).reset_index (drop = True ),
368
+ sort_by_col1 ( expected ).reset_index (drop = True ),
369
+ sort_by_col1 ( result ).reset_index (drop = True ),
366
370
)
367
371
368
372
# left have one chunk and how="left", then one chunk tile
@@ -377,8 +381,8 @@ def test_merge_one_chunk(setup):
377
381
result = jdf .execute ().fetch ()
378
382
379
383
pd .testing .assert_frame_equal (
380
- expected . sort_values ( by = expected . columns [ 1 ] ).reset_index (drop = True ),
381
- result . sort_values ( by = result . columns [ 1 ] ).reset_index (drop = True ),
384
+ sort_by_col1 ( expected ).reset_index (drop = True ),
385
+ sort_by_col1 ( result ).reset_index (drop = True ),
382
386
)
383
387
384
388
@@ -418,7 +422,8 @@ def test_broadcast_merge(setup):
418
422
expected .set_index ("key" , inplace = True )
419
423
result .set_index ("key" , inplace = True )
420
424
pd .testing .assert_frame_equal (
421
- sort_dataframe_inplace (expected , 0 ), sort_dataframe_inplace (result , 0 )
425
+ sort_dataframe_inplace (expected , 0 , kind = "mergesort" ),
426
+ sort_dataframe_inplace (result , 0 , kind = "mergesort" ),
422
427
)
423
428
424
429
# test broadcast right and how="left"
@@ -438,8 +443,8 @@ def test_broadcast_merge(setup):
438
443
expected .set_index ("key" , inplace = True )
439
444
result .set_index ("key" , inplace = True )
440
445
pd .testing .assert_frame_equal (
441
- expected .sort_values (by = ["key" , "value_x" ]),
442
- result .sort_values (by = ["key" , "value_x" ]),
446
+ expected .sort_values (by = ["key" , "value_x" ], kind = "mergesort" ),
447
+ result .sort_values (by = ["key" , "value_x" ], kind = "mergesort" ),
443
448
)
444
449
445
450
# test broadcast left
@@ -459,7 +464,8 @@ def test_broadcast_merge(setup):
459
464
expected .set_index ("key" , inplace = True )
460
465
result .set_index ("key" , inplace = True )
461
466
pd .testing .assert_frame_equal (
462
- sort_dataframe_inplace (expected , 0 ), sort_dataframe_inplace (result , 0 )
467
+ sort_dataframe_inplace (expected , 0 , kind = "mergesort" ),
468
+ sort_dataframe_inplace (result , 0 , kind = "mergesort" ),
463
469
)
464
470
465
471
# test broadcast left and how="right"
@@ -479,8 +485,8 @@ def test_broadcast_merge(setup):
479
485
expected .set_index ("key" , inplace = True )
480
486
result .set_index ("key" , inplace = True )
481
487
pd .testing .assert_frame_equal (
482
- expected .sort_values (by = ["key" , "value_x" ]),
483
- result .sort_values (by = ["key" , "value_x" ]),
488
+ expected .sort_values (by = ["key" , "value_x" ], kind = "mergesort" ),
489
+ result .sort_values (by = ["key" , "value_x" ], kind = "mergesort" ),
484
490
)
485
491
486
492
0 commit comments