Skip to content

Commit 576923b

Browse files
committed
Fix test failures
1 parent 0a42ba8 commit 576923b

File tree

4 files changed

+23
-22
lines changed

4 files changed

+23
-22
lines changed

mars/dataframe/merge/tests/test_merge_execution.py

Lines changed: 19 additions & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -312,11 +312,15 @@ def test_join_on(setup):
312312
expected4.set_index("a2", inplace=True)
313313
result4.set_index("a2", inplace=True)
314314
pd.testing.assert_frame_equal(
315-
sort_dataframe_inplace(expected4, 0), sort_dataframe_inplace(result4, 0)
315+
sort_dataframe_inplace(expected4, 0, kind="mergesort"),
316+
sort_dataframe_inplace(result4, 0, kind="mergesort"),
316317
)
317318

318319

319320
def test_merge_one_chunk(setup):
321+
def sort_by_col1(df):
322+
return df.sort_values(by=df.columns[1], kind="mergesort")
323+
320324
df1 = pd.DataFrame(
321325
{"lkey": ["foo", "bar", "baz", "foo"], "value": [1, 2, 3, 5]},
322326
index=["a1", "a2", "a3", "a4"],
@@ -348,8 +352,8 @@ def test_merge_one_chunk(setup):
348352
result = jdf.execute().fetch()
349353

350354
pd.testing.assert_frame_equal(
351-
expected.sort_values(by=expected.columns[1]).reset_index(drop=True),
352-
result.sort_values(by=result.columns[1]).reset_index(drop=True),
355+
sort_by_col1(expected).reset_index(drop=True),
356+
sort_by_col1(result).reset_index(drop=True),
353357
)
354358

355359
# right have one chunk
@@ -361,8 +365,8 @@ def test_merge_one_chunk(setup):
361365
result = jdf.execute().fetch()
362366

363367
pd.testing.assert_frame_equal(
364-
expected.sort_values(by=expected.columns[1]).reset_index(drop=True),
365-
result.sort_values(by=result.columns[1]).reset_index(drop=True),
368+
sort_by_col1(expected).reset_index(drop=True),
369+
sort_by_col1(result).reset_index(drop=True),
366370
)
367371

368372
# left have one chunk and how="left", then one chunk tile
@@ -377,8 +381,8 @@ def test_merge_one_chunk(setup):
377381
result = jdf.execute().fetch()
378382

379383
pd.testing.assert_frame_equal(
380-
expected.sort_values(by=expected.columns[1]).reset_index(drop=True),
381-
result.sort_values(by=result.columns[1]).reset_index(drop=True),
384+
sort_by_col1(expected).reset_index(drop=True),
385+
sort_by_col1(result).reset_index(drop=True),
382386
)
383387

384388

@@ -418,7 +422,8 @@ def test_broadcast_merge(setup):
418422
expected.set_index("key", inplace=True)
419423
result.set_index("key", inplace=True)
420424
pd.testing.assert_frame_equal(
421-
sort_dataframe_inplace(expected, 0), sort_dataframe_inplace(result, 0)
425+
sort_dataframe_inplace(expected, 0, kind="mergesort"),
426+
sort_dataframe_inplace(result, 0, kind="mergesort"),
422427
)
423428

424429
# test broadcast right and how="left"
@@ -438,8 +443,8 @@ def test_broadcast_merge(setup):
438443
expected.set_index("key", inplace=True)
439444
result.set_index("key", inplace=True)
440445
pd.testing.assert_frame_equal(
441-
expected.sort_values(by=["key", "value_x"]),
442-
result.sort_values(by=["key", "value_x"]),
446+
expected.sort_values(by=["key", "value_x"], kind="mergesort"),
447+
result.sort_values(by=["key", "value_x"], kind="mergesort"),
443448
)
444449

445450
# test broadcast left
@@ -459,7 +464,8 @@ def test_broadcast_merge(setup):
459464
expected.set_index("key", inplace=True)
460465
result.set_index("key", inplace=True)
461466
pd.testing.assert_frame_equal(
462-
sort_dataframe_inplace(expected, 0), sort_dataframe_inplace(result, 0)
467+
sort_dataframe_inplace(expected, 0, kind="mergesort"),
468+
sort_dataframe_inplace(result, 0, kind="mergesort"),
463469
)
464470

465471
# test broadcast left and how="right"
@@ -479,8 +485,8 @@ def test_broadcast_merge(setup):
479485
expected.set_index("key", inplace=True)
480486
result.set_index("key", inplace=True)
481487
pd.testing.assert_frame_equal(
482-
expected.sort_values(by=["key", "value_x"]),
483-
result.sort_values(by=["key", "value_x"]),
488+
expected.sort_values(by=["key", "value_x"], kind="mergesort"),
489+
result.sort_values(by=["key", "value_x"], kind="mergesort"),
484490
)
485491

486492

mars/dataframe/utils.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -106,9 +106,9 @@ def hash_dtypes(dtypes, size):
106106
return [dtypes[index] for index in hashed_indexes]
107107

108108

109-
def sort_dataframe_inplace(df, *axis):
109+
def sort_dataframe_inplace(df, *axis, **kw):
110110
for ax in axis:
111-
df.sort_index(axis=ax, inplace=True)
111+
df.sort_index(axis=ax, inplace=True, **kw)
112112
return df
113113

114114

mars/learn/contrib/lightgbm/core.py

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -20,7 +20,6 @@
2020
import pandas as pd
2121

2222
from ....dataframe import DataFrame as MarsDataFrame, Series as MarsSeries
23-
from ....lib.version import parse as parse_version
2423
from ....tensor import tensor as mars_tensor
2524

2625

mars/learn/contrib/lightgbm/tests/test_classifier.py

Lines changed: 2 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -75,9 +75,7 @@ def test_local_classifier(create_cluster):
7575
# test sparse tensor
7676
X_sparse_data = X_sparse
7777
classifier = LGBMClassifier(n_estimators=2)
78-
classifier.fit(
79-
X_sparse_data, y_data, eval_set=[(X_sparse_data, y_data)]
80-
)
78+
classifier.fit(X_sparse_data, y_data, eval_set=[(X_sparse_data, y_data)])
8179
prediction = classifier.predict(X_sparse_data)
8280

8381
assert prediction.ndim == 1
@@ -118,9 +116,7 @@ def test_local_classifier(create_cluster):
118116

119117
# should raise error if weight.ndim > 1
120118
with pytest.raises(ValueError):
121-
LGBMClassifier(n_estimators=2).fit(
122-
X, y_df, sample_weight=mt.random.rand(1, 1)
123-
)
119+
LGBMClassifier(n_estimators=2).fit(X, y_df, sample_weight=mt.random.rand(1, 1))
124120

125121
# test binary classifier
126122
new_y = (y_data > 0.5).astype(mt.int32)

0 commit comments

Comments
 (0)