From 36dcc86df44fb6c057854a5e2086aeee9b41c97a Mon Sep 17 00:00:00 2001 From: Hendrik Makait Date: Wed, 30 Oct 2024 16:13:41 +0100 Subject: [PATCH] Add descriptions --- tests/geospatial/test_cloud_optimize.py | 17 ++++++++++++++++- tests/geospatial/test_satellite_filtering.py | 12 ++++++++++++ 2 files changed, 28 insertions(+), 1 deletion(-) diff --git a/tests/geospatial/test_cloud_optimize.py b/tests/geospatial/test_cloud_optimize.py index f3a15f5e74..32f143f9c6 100644 --- a/tests/geospatial/test_cloud_optimize.py +++ b/tests/geospatial/test_cloud_optimize.py @@ -16,6 +16,21 @@ def test_cloud_optimize( "large": {"n_workers": 200}, }, ): + """ + This benchmark loads the NASA Earth Exchange Global Daily Downscaled Projections (NEX-GDDP-CMIP6) + dataset stored in NetCDF, rechunks it from time-oriented chunks to spatial chunks, and writes it + to a Zarr dataset. + + The benchmark can be scaled across these dimensions: + + * Models + * Variables + * Time + * Space + * Cluster size + + At the moment, it is not scaled along the temporal or spatial dimensions. + """ with client_factory( **scale_kwargs[scale], **cluster_kwargs ) as client: # noqa: F841 @@ -96,5 +111,5 @@ def test_cloud_optimize( # Rechunk from "pancake" to "pencil" format ds = ds.chunk({"time": -1, "lon": "auto", "lat": "auto"}) - # Write out to a Zar dataset + # Write out to a Zarr dataset ds.to_zarr(s3_url) diff --git a/tests/geospatial/test_satellite_filtering.py b/tests/geospatial/test_satellite_filtering.py index b6049e95ee..a58bb90625 100644 --- a/tests/geospatial/test_satellite_filtering.py +++ b/tests/geospatial/test_satellite_filtering.py @@ -67,6 +67,18 @@ def test_satellite_filtering( "large": {"n_workers": 100}, }, ): + """ + This benchmark processes Sentinel-2 satellite imagery. It computes the monthly average of a humidity index + and stores the result to a Zarr dataset. + + The benchmark can be scaled across these dimensions: + * Indices to calculate + * Time + * Space + * Cluster size + + At the moment, the spatial extent is fixed to Germany and only a single index is derived. + """ with client_factory( **scale_kwargs[scale], env={