From 0f0cca64017a24f5adb18284a401208c8360b373 Mon Sep 17 00:00:00 2001 From: Phillip Cloud <417981+cpcloud@users.noreply.github.com> Date: Sun, 21 Jul 2024 10:47:18 -0400 Subject: [PATCH] feat(api): support selectors in window function `order_by` and `group_by` --- ibis/common/selectors.py | 49 +++++++++++++++++++++++++++++++ ibis/expr/builders.py | 6 ++-- ibis/expr/types/relations.py | 2 +- ibis/selectors.py | 42 ++------------------------ ibis/tests/expr/test_selectors.py | 23 +++++++++++++++ 5 files changed, 79 insertions(+), 43 deletions(-) create mode 100644 ibis/common/selectors.py diff --git a/ibis/common/selectors.py b/ibis/common/selectors.py new file mode 100644 index 000000000000..c74a8cfa4290 --- /dev/null +++ b/ibis/common/selectors.py @@ -0,0 +1,49 @@ +from __future__ import annotations + +import abc +from typing import TYPE_CHECKING + +from ibis.common.grounds import Concrete + +if TYPE_CHECKING: + from collections.abc import Sequence + + import ibis.expr.types as ir + + +class Selector(Concrete): + """A column selector.""" + + @abc.abstractmethod + def expand(self, table: ir.Table) -> Sequence[ir.Value]: + """Expand `table` into value expressions that match the selector. + + Parameters + ---------- + table + An ibis table expression + + Returns + ------- + Sequence[Value] + A sequence of value expressions that match the selector + + """ + + def positions(self, table: ir.Table) -> Sequence[int]: + """Expand `table` into column indices that match the selector. + + Parameters + ---------- + table + An ibis table expression + + Returns + ------- + Sequence[int] + A sequence of column indices where the selector matches + + """ + raise NotImplementedError( + f"`positions` doesn't make sense for {self.__class__.__name__} selector" + ) diff --git a/ibis/expr/builders.py b/ibis/expr/builders.py index 59d131123df0..8a82bac85adc 100644 --- a/ibis/expr/builders.py +++ b/ibis/expr/builders.py @@ -18,6 +18,8 @@ if TYPE_CHECKING: from typing_extensions import Self + from ibis.common.selectors import Selector + class Builder(Concrete): pass @@ -145,8 +147,8 @@ class WindowBuilder(Builder): how: Literal["rows", "range"] = "rows" start: Optional[RangeWindowBoundary] = None end: Optional[RangeWindowBoundary] = None - groupings: VarTuple[Union[str, Resolver, ops.Value]] = () - orderings: VarTuple[Union[str, Resolver, ops.SortKey]] = () + groupings: Selector | VarTuple[Union[str, Resolver, Selector, ops.Value]] = () + orderings: Selector | VarTuple[Union[str, Resolver, Selector, ops.SortKey]] = () @attribute def _table(self): diff --git a/ibis/expr/types/relations.py b/ibis/expr/types/relations.py index f66d6d64c0c0..0d461c8a4092 100644 --- a/ibis/expr/types/relations.py +++ b/ibis/expr/types/relations.py @@ -18,12 +18,12 @@ import ibis.expr.schema as sch from ibis import util from ibis.common.deferred import Deferred, Resolver +from ibis.common.selectors import Selector from ibis.expr.rewrites import DerefMap from ibis.expr.types.core import Expr, _FixedTextJupyterMixin from ibis.expr.types.generic import Value, literal from ibis.expr.types.pretty import to_rich from ibis.expr.types.temporal import TimestampColumn -from ibis.selectors import Selector from ibis.util import deprecated if TYPE_CHECKING: diff --git a/ibis/selectors.py b/ibis/selectors.py index 2f51a1592363..81c6aa03f55a 100644 --- a/ibis/selectors.py +++ b/ibis/selectors.py @@ -50,7 +50,6 @@ from __future__ import annotations -import abc import functools import inspect import operator @@ -67,45 +66,8 @@ from ibis.common.collections import frozendict # noqa: TCH001 from ibis.common.deferred import Deferred, Resolver from ibis.common.exceptions import IbisError -from ibis.common.grounds import Concrete, Singleton - - -class Selector(Concrete): - """A column selector.""" - - @abc.abstractmethod - def expand(self, table: ir.Table) -> Sequence[ir.Value]: - """Expand `table` into value expressions that match the selector. - - Parameters - ---------- - table - An ibis table expression - - Returns - ------- - Sequence[Value] - A sequence of value expressions that match the selector - - """ - - def positions(self, table: ir.Table) -> Sequence[int]: - """Expand `table` into column indices that match the selector. - - Parameters - ---------- - table - An ibis table expression - - Returns - ------- - Sequence[int] - A sequence of column indices where the selector matches - - """ - raise NotImplementedError( - f"`positions` doesn't make sense for {self.__class__.__name__} selector" - ) +from ibis.common.grounds import Singleton +from ibis.common.selectors import Selector class Predicate(Selector): diff --git a/ibis/tests/expr/test_selectors.py b/ibis/tests/expr/test_selectors.py index 62c7821e91af..fac48716345a 100644 --- a/ibis/tests/expr/test_selectors.py +++ b/ibis/tests/expr/test_selectors.py @@ -494,3 +494,26 @@ def test_order_by_with_selectors(penguins): with pytest.raises(exc.IbisError): penguins.order_by(~s.all()) + + +def test_window_function_group_by(penguins): + expr = penguins.species.count().over(group_by=s.c("island")) + assert expr.equals(penguins.species.count().over(group_by=penguins.island)) + + +def test_window_function_order_by(penguins): + expr = penguins.island.count().over(order_by=s.c("species")) + assert expr.equals(penguins.island.count().over(order_by=penguins.species)) + + +def test_window_function_group_by_order_by(penguins): + expr = penguins.species.count().over( + group_by=s.c("island"), + order_by=s.c("year") | (~s.c("island", "species") & s.of_type("str")), + ) + assert expr.equals( + penguins.species.count().over( + group_by=penguins.island, + order_by=[penguins.sex, penguins.year], + ) + )