Skip to content

Commit

Permalink
Switched from black to ruff.
Browse files Browse the repository at this point in the history
  • Loading branch information
coady committed Dec 22, 2023
1 parent b174c06 commit 47371bd
Show file tree
Hide file tree
Showing 17 changed files with 236 additions and 226 deletions.
2 changes: 1 addition & 1 deletion .github/workflows/build.yml
Original file line number Diff line number Diff line change
Expand Up @@ -34,7 +34,7 @@ jobs:
- uses: actions/setup-python@v5
with:
python-version: 3.x
- run: pip install black ruff mypy
- run: pip install ruff mypy
- run: make lint

docs:
Expand Down
2 changes: 0 additions & 2 deletions .github/workflows/release.yml
Original file line number Diff line number Diff line change
Expand Up @@ -20,5 +20,3 @@ jobs:
- run: make html
- run: PYTHONPATH=$PWD python -m mkdocs gh-deploy --force
- uses: pypa/gh-action-pypi-publish@release/v1
with:
verbose: true
2 changes: 1 addition & 1 deletion Makefile
Original file line number Diff line number Diff line change
Expand Up @@ -2,8 +2,8 @@ check:
python -m pytest -s --cov

lint:
black --check .
ruff .
ruff format --check .
mypy -p graphique

html: docs/schema.md
Expand Down
1 change: 0 additions & 1 deletion README.md
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@
[![image](https://github.com/coady/graphique/workflows/build/badge.svg)](https://github.com/coady/graphique/actions)
[![image](https://codecov.io/gh/coady/graphique/branch/main/graph/badge.svg)](https://codecov.io/gh/coady/graphique/)
[![image](https://github.com/coady/graphique/workflows/codeql/badge.svg)](https://github.com/coady/graphique/security/code-scanning)
[![image](https://img.shields.io/badge/code%20style-black-000000.svg)](https://pypi.org/project/black/)
[![image](https://img.shields.io/endpoint?url=https://raw.githubusercontent.com/astral-sh/ruff/main/assets/badge/v2.json)](https://github.com/astral-sh/ruff)
[![image](https://mypy-lang.org/static/mypy_badge.svg)](https://mypy-lang.org/)

Expand Down
16 changes: 8 additions & 8 deletions docs/examples.ipynb
Original file line number Diff line number Diff line change
Expand Up @@ -37,15 +37,15 @@
"outputs": [],
"source": [
"execute(\n",
" '''{\n",
" \"\"\"{\n",
" length\n",
" schema {\n",
" names\n",
" types\n",
" partitioning\n",
" index\n",
" }\n",
"}'''\n",
"}\"\"\"\n",
")"
]
},
Expand Down Expand Up @@ -103,7 +103,7 @@
"outputs": [],
"source": [
"execute(\n",
" '''{\n",
" \"\"\"{\n",
" filter(state: {eq: \"CA\"}) {\n",
" group(by: \"county\", aggregate: {countDistinct: {name: \"city\", alias: \"cities\"}}) {\n",
" sort(by: \"-cities\", length: 5) {\n",
Expand All @@ -120,7 +120,7 @@
" }\n",
" }\n",
" }\n",
"}'''\n",
"}\"\"\"\n",
")"
]
},
Expand All @@ -141,7 +141,7 @@
"outputs": [],
"source": [
"execute(\n",
" '''{\n",
" \"\"\"{\n",
" scan(filter: {eq: [{name: \"county\"}, {name: \"city\"}]}) {\n",
" columns {\n",
" state {\n",
Expand All @@ -152,7 +152,7 @@
" }\n",
" }\n",
" }\n",
"}'''\n",
"}\"\"\"\n",
")"
]
},
Expand All @@ -177,7 +177,7 @@
"outputs": [],
"source": [
"execute(\n",
" '''{\n",
" \"\"\"{\n",
" scan(columns: {alias: \"match\", eq: [{name: \"county\"}, {name: \"city\"}]}) {\n",
" group(by: \"state\", aggregate: {any: {name: \"match\"}}) {\n",
" scan(filter: {inv: {name: \"match\"}}) {\n",
Expand All @@ -189,7 +189,7 @@
" }\n",
" }\n",
" }\n",
"}'''\n",
"}\"\"\"\n",
")"
]
}
Expand Down
6 changes: 5 additions & 1 deletion graphique/core.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@
Arrow forbids subclassing, so the classes are for logical grouping.
Their methods are called as functions.
"""

import bisect
import contextlib
import functools
Expand Down Expand Up @@ -106,7 +107,10 @@ def register(func: Callable, kind: str = 'scalar') -> pc.Function:

@register
def digitize(
ctx, array: pa.float64(), bins: pa.list_(pa.float64()), right: pa.bool_() # type: ignore
ctx,
array: pa.float64(), # type: ignore
bins: pa.list_(pa.float64()), # type: ignore
right: pa.bool_(), # type: ignore
) -> pa.int64(): # type: ignore
"""Return the indices of the bins to which each value in input array belongs."""
return pa.array(np.digitize(array, bins.values, right.as_py()))
Expand Down
1 change: 1 addition & 0 deletions graphique/inputs.py
Original file line number Diff line number Diff line change
@@ -1,6 +1,7 @@
"""
GraphQL input types.
"""

import functools
import inspect
import operator
Expand Down
11 changes: 7 additions & 4 deletions graphique/interface.py
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,7 @@
Doesn't require knowledge of the schema.
"""

# mypy: disable-error-code=valid-type
import collections
import inspect
Expand Down Expand Up @@ -234,7 +235,11 @@ def slice(
aggregate="aggregation functions applied to other columns",
)
def group(
self, info: Info, by: list[str] = [], counts: str = '', aggregate: HashAggregates = {} # type: ignore
self,
info: Info,
by: list[str] = [],
counts: str = '',
aggregate: HashAggregates = {}, # type: ignore
) -> Self:
"""Return table grouped by columns.
Expand Down Expand Up @@ -497,9 +502,7 @@ def oneshot(cls, info: Info, scanner: ds.Scanner) -> Union[ds.Scanner, pa.Table]
return scanner

@doc_field(filter="selected rows", columns="projected columns")
def scan(
self, info: Info, filter: Expression = {}, columns: list[Projection] = [] # type: ignore
) -> Self:
def scan(self, info: Info, filter: Expression = {}, columns: list[Projection] = []) -> Self: # type: ignore
"""Select rows and project columns without memory usage."""
expr = filter.to_arrow()
if expr is not None and not columns and isinstance(self.table, ds.Dataset):
Expand Down
1 change: 1 addition & 0 deletions graphique/middleware.py
Original file line number Diff line number Diff line change
@@ -1,6 +1,7 @@
"""
ASGI GraphQL utilities.
"""

import warnings
from collections.abc import Iterable, Mapping
from datetime import timedelta
Expand Down
4 changes: 2 additions & 2 deletions graphique/models.py
Original file line number Diff line number Diff line change
@@ -1,6 +1,7 @@
"""
GraphQL output types and resolvers.
"""

import collections
import functools
import inspect
Expand Down Expand Up @@ -174,8 +175,7 @@ def fill_null(self, value: T) -> list[T]:

@Column.register(str)
@strawberry.type(name='ingColumn', description="column of strings")
class StringColumn(OrdinalColumn[T]):
...
class StringColumn(OrdinalColumn[T]): ...


@strawberry.type
Expand Down
1 change: 1 addition & 0 deletions graphique/scalars.py
Original file line number Diff line number Diff line change
@@ -1,6 +1,7 @@
"""
GraphQL scalars.
"""

from datetime import date, datetime, time, timedelta
from decimal import Decimal
import pyarrow as pa
Expand Down
1 change: 1 addition & 0 deletions graphique/service.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,7 @@
* datasets, scanners, and tables
* filtering and projection
"""

import json
from pathlib import Path
import pyarrow.dataset as ds
Expand Down
1 change: 1 addition & 0 deletions graphique/shell.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,7 @@
sufficient once partitioned, but there is a `fragments` option to optimize for memory or show
progress on the second pass.
"""

import argparse
import shutil
from pathlib import Path
Expand Down
9 changes: 5 additions & 4 deletions pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -49,12 +49,13 @@ version = {attr = "graphique.__version__"}
[tool.setuptools.package-data]
graphique = ["py.typed"]

[tool.black]
[tool.ruff]
line-length = 100
skip-string-normalization = true
extend-include = ["*.ipynb"]

[tool.ruff]
ignore = ["E501"]
[tool.ruff.format]
preview = true
quote-style = "preserve"

[[tool.mypy.overrides]]
module = ["pyarrow.*", "strawberry.*", "starlette.*"]
Expand Down
70 changes: 35 additions & 35 deletions tests/test_dataset.py
Original file line number Diff line number Diff line change
Expand Up @@ -40,18 +40,18 @@ def test_search(dsclient):
data = dsclient.execute('{ filter(zipcode: {}) { row { zipcode } } }')
assert data == {'filter': {'row': {'zipcode': 501}}}
data = dsclient.execute(
'''{ filter(zipcode: {gt: 90000}) { filter(state: {eq: "CA"}) {
length } } }'''
"""{ filter(zipcode: {gt: 90000}) { filter(state: {eq: "CA"}) {
length } } }"""
)
assert data == {'filter': {'filter': {'length': 2647}}}
data = dsclient.execute(
'''{ filter(zipcode: {gt: 90000}) { filter(state: {eq: "CA"}) {
length row { zipcode } } } }'''
"""{ filter(zipcode: {gt: 90000}) { filter(state: {eq: "CA"}) {
length row { zipcode } } } }"""
)
assert data == {'filter': {'filter': {'length': 2647, 'row': {'zipcode': 90001}}}}
data = dsclient.execute(
'''{ filter(zipcode: {lt: 90000}) { filter(state: {eq: "CA"}) {
group(by: "county") { length } } } }'''
"""{ filter(zipcode: {lt: 90000}) { filter(state: {eq: "CA"}) {
group(by: "county") { length } } } }"""
)
assert data == {'filter': {'filter': {'group': {'length': 0}}}}

Expand All @@ -75,12 +75,12 @@ def test_slice(dsclient):

def test_group(dsclient):
data = dsclient.execute(
'''{ group(by: ["state"], aggregate: {min: {name: "county"}}) { row { state county } } }'''
"""{ group(by: ["state"], aggregate: {min: {name: "county"}}) { row { state county } } }"""
)
assert data == {'group': {'row': {'state': 'NY', 'county': 'Albany'}}}
data = dsclient.execute(
'''{ group(by: ["state"], counts: "c") { slice(length: 1) {
column(name: "c") { ... on LongColumn { values } } } } }'''
"""{ group(by: ["state"], counts: "c") { slice(length: 1) {
column(name: "c") { ... on LongColumn { values } } } } }"""
)
assert data == {'group': {'slice': {'column': {'values': [2205]}}}}
data = dsclient.execute(
Expand All @@ -92,34 +92,34 @@ def test_group(dsclient):
)
assert data['group']['row']['county']
data = dsclient.execute(
'''{ group(by: ["state"], aggregate: {mean: {name: "zipcode"}}) { slice(length: 1) {
column(name: "zipcode") { ... on FloatColumn { values } } } } }'''
"""{ group(by: ["state"], aggregate: {mean: {name: "zipcode"}}) { slice(length: 1) {
column(name: "zipcode") { ... on FloatColumn { values } } } } }"""
)
assert data == {'group': {'slice': {'column': {'values': [pytest.approx(12614.62721)]}}}}
data = dsclient.execute(
'''{ group(by: ["state"], aggregate: {list: {name: "zipcode"}}) { aggregate(mean: {name: "zipcode"}) {
slice(length: 1) { column(name: "zipcode") { ... on FloatColumn { values } } } } } }'''
"""{ group(by: ["state"], aggregate: {list: {name: "zipcode"}}) { aggregate(mean: {name: "zipcode"}) {
slice(length: 1) { column(name: "zipcode") { ... on FloatColumn { values } } } } } }"""
)
assert data == {
'group': {'aggregate': {'slice': {'column': {'values': [pytest.approx(12614.62721)]}}}}
}
data = dsclient.execute(
'''{ group(aggregate: {min: {alias: "st", name: "state"}}) {
column(name: "st") { ... on StringColumn { values } } } }'''
"""{ group(aggregate: {min: {alias: "st", name: "state"}}) {
column(name: "st") { ... on StringColumn { values } } } }"""
)
assert data == {'group': {'column': {'values': ['AK']}}}


def test_list(partclient):
data = partclient.execute(
'''{ group(by: "state", aggregate: {distinct: {alias: "counties", name: "county"}}) {
tables { row { state } column(name: "counties") { length } } } } '''
"""{ group(by: "state", aggregate: {distinct: {alias: "counties", name: "county"}}) {
tables { row { state } column(name: "counties") { length } } } } """
)
(table,) = [table for table in data['group']['tables'] if table['row']['state'] == 'PR']
assert table == {'row': {'state': 'PR'}, 'column': {'length': 78}}
data = partclient.execute(
'''{ group(by: "north", aggregate: {distinct: {name: "west"}}) {
tables { row { north } columns { west { length } } } } }'''
"""{ group(by: "north", aggregate: {distinct: {name: "west"}}) {
tables { row { north } columns { west { length } } } } }"""
)
tables = data['group']['tables']
assert {table['row']['north'] for table in tables} == {0, 1}
Expand Down Expand Up @@ -147,13 +147,13 @@ def test_fragments(partclient):
)
assert data == {'group': {'length': 1, 'row': {'state': 'AK'}}}
data = partclient.execute(
'''{ group(by: ["north", "west"], aggregate: {distinct: {name: "city"}, mean: {name: "zipcode"}}) {
length column(name: "city") { type } } }'''
"""{ group(by: ["north", "west"], aggregate: {distinct: {name: "city"}, mean: {name: "zipcode"}}) {
length column(name: "city") { type } } }"""
)
assert data == {'group': {'length': 4, 'column': {'type': 'large_list<item: string>'}}}
data = partclient.execute(
'''{ group(by: "north", aggregate: {countDistinct: {name: "west"}}) {
column(name: "west") { ... on LongColumn { values } } } }'''
"""{ group(by: "north", aggregate: {countDistinct: {name: "west"}}) {
column(name: "west") { ... on LongColumn { values } } } }"""
)
assert data == {'group': {'column': {'values': [2, 2]}}}
data = partclient.execute(
Expand Down Expand Up @@ -204,14 +204,14 @@ def test_scan(dsclient):
with pytest.raises(ValueError, match="name or alias"):
dsclient.execute('{ scan(columns: {}) { length } }')
data = dsclient.execute(
'''{ scan(filter: {eq: [{name: "state"}, {value: "CA"}]})
"""{ scan(filter: {eq: [{name: "state"}, {value: "CA"}]})
{ scan(filter: {eq: [{name: "county"}, {value: "Santa Clara"}]})
{ length row { county } } } }'''
{ length row { county } } } }"""
)
assert data == {'scan': {'scan': {'length': 108, 'row': {'county': 'Santa Clara'}}}}
data = dsclient.execute(
'''{ scan(filter: {or: [{eq: [{name: "state"}, {value: "CA"}]},
{eq: [{name: "county"}, {value: "Santa Clara"}]}]}) { length } }'''
"""{ scan(filter: {or: [{eq: [{name: "state"}, {value: "CA"}]},
{eq: [{name: "county"}, {value: "Santa Clara"}]}]}) { length } }"""
)
assert data == {'scan': {'length': 2647}}

Expand Down Expand Up @@ -256,30 +256,30 @@ def test_federation(fedclient):
assert data['zipDb'] == {'__typename': 'ZipDbTable', 'length': 42724}

data = fedclient.execute(
'''{ zipcodes { scan(columns: {name: "zipcode", cast: "int64"}) {
join(right: "zip_db", keys: "zipcode", rightKeys: "zip") { length schema { names } } } } }'''
"""{ zipcodes { scan(columns: {name: "zipcode", cast: "int64"}) {
join(right: "zip_db", keys: "zipcode", rightKeys: "zip") { length schema { names } } } } }"""
)
table = data['zipcodes']['scan']['join']
assert table['length'] == 41700
assert set(table['schema']['names']) > {'zipcode', 'timezone', 'latitude'}
data = fedclient.execute(
'''{ zipcodes { scan(columns: {alias: "zip", name: "zipcode", cast: "int64"}) {
join(right: "zip_db", keys: "zip", joinType: "right outer") { length schema { names } } } } }'''
"""{ zipcodes { scan(columns: {alias: "zip", name: "zipcode", cast: "int64"}) {
join(right: "zip_db", keys: "zip", joinType: "right outer") { length schema { names } } } } }"""
)
table = data['zipcodes']['scan']['join']
assert table['length'] == 42724
assert set(table['schema']['names']) > {'zip', 'timezone', 'latitude'}

data = fedclient.execute(
'''{ _entities(representations: {__typename: "ZipcodesTable", zipcode: 90001}) {
... on ZipcodesTable { length row { state } schema { names } } } }'''
"""{ _entities(representations: {__typename: "ZipcodesTable", zipcode: 90001}) {
... on ZipcodesTable { length row { state } schema { names } } } }"""
)
assert data == {
'_entities': [{'length': 1, 'row': {'state': 'CA'}, 'schema': {'names': ['state']}}]
}
data = fedclient.execute(
'''{ states { filter(state: {eq: "CA"}) { columns { indices {
takeFrom(field: "zipcodes") { __typename column(name: "state") { length } } } } } } }'''
"""{ states { filter(state: {eq: "CA"}) { columns { indices {
takeFrom(field: "zipcodes") { __typename column(name: "state") { length } } } } } } }"""
)
table = data['states']['filter']['columns']['indices']['takeFrom']
assert table == {'__typename': 'ZipcodesTable', 'column': {'length': 2647}}
Expand Down
Loading

0 comments on commit 47371bd

Please sign in to comment.