From 8c70ed8ee36f44698af47c01ee397e13597301a9 Mon Sep 17 00:00:00 2001
From: ritchie
Date: Fri, 27 Dec 2024 16:52:57 +0100
Subject: [PATCH] fix: Don't remove sort if first/last strategy is set in unique

---
 .../src/plans/optimizer/set_order.rs          |  7 +++++-
 .../unit/operations/unique/test_unique.py     | 25 +++++++++++++++++++
 2 files changed, 31 insertions(+), 1 deletion(-)

diff --git a/crates/polars-plan/src/plans/optimizer/set_order.rs b/crates/polars-plan/src/plans/optimizer/set_order.rs
index 022529fbf9a9..b6d360cc56db 100644
--- a/crates/polars-plan/src/plans/optimizer/set_order.rs
+++ b/crates/polars-plan/src/plans/optimizer/set_order.rs
@@ -101,7 +101,12 @@ pub(super) fn set_order_flags(
                     options.maintain_order = false;
                     continue;
                 }
-                if !options.maintain_order {
+                if matches!(
+                    options.keep_strategy,
+                    UniqueKeepStrategy::First | UniqueKeepStrategy::Last
+                ) {
+                    maintain_order_above = true;
+                } else if !options.maintain_order {
                     maintain_order_above = false;
                 }
             },
diff --git a/py-polars/tests/unit/operations/unique/test_unique.py b/py-polars/tests/unit/operations/unique/test_unique.py
index c15db38da503..d986c1d4282e 100644
--- a/py-polars/tests/unit/operations/unique/test_unique.py
+++ b/py-polars/tests/unit/operations/unique/test_unique.py
@@ -175,3 +175,28 @@ def test_categorical_updated_revmap_unique_20233() -> None:
         )
 
         assert_series_equal(s.unique(), pl.Series("a", ["D"], pl.Categorical))
+
+
+def test_unique_check_order_20480() -> None:
+    df = pl.DataFrame(
+        [
+            {
+                "key": "some_key",
+                "value": "second",
+                "number": 2,
+            },
+            {
+                "key": "some_key",
+                "value": "first",
+                "number": 1,
+            },
+        ]
+    )
+    assert (
+        df.lazy()
+        .sort("key", "number")
+        .unique(subset="key", keep="first")
+        .collect()["number"]
+        .item()
+        == 1
+    )