coiled · hendrikmakait · Oct 30, 2024
diff --git a/tests/geospatial/test_cloud_optimize.py b/tests/geospatial/test_cloud_optimize.py
@@ -16,6 +16,21 @@ def test_cloud_optimize(
         "large": {"n_workers": 200},
     },
 ):
+    """
+    This benchmark loads the NASA Earth Exchange Global Daily Downscaled Projections (NEX-GDDP-CMIP6)
+    dataset stored in NetCDF, rechunks it from time-oriented chunks to spatial chunks, and writes it
+    to a Zarr dataset.
+
+    The benchmark can be scaled across these dimensions:
+
+    * Models
+    * Variables
+    * Time
+    * Space
+    * Cluster size
+
+    At the moment, it is not scaled along the temporal or spatial dimensions.
+    """
     with client_factory(
         **scale_kwargs[scale], **cluster_kwargs
     ) as client:  # noqa: F841
@@ -96,5 +111,5 @@ def test_cloud_optimize(
         # Rechunk from "pancake" to "pencil" format
         ds = ds.chunk({"time": -1, "lon": "auto", "lat": "auto"})
 
-        # Write out to a Zar dataset
+        # Write out to a Zarr dataset
         ds.to_zarr(s3_url)
diff --git a/tests/geospatial/test_satellite_filtering.py b/tests/geospatial/test_satellite_filtering.py
@@ -67,6 +67,18 @@ def test_satellite_filtering(
         "large": {"n_workers": 100},
     },
 ):
+    """
+    This benchmark processes Sentinel-2 satellite imagery. It computes the monthly average of a humidity index
+    and stores the result to a Zarr dataset.
+
+    The benchmark can be scaled across these dimensions:
+    * Indices to calculate
+    * Time
+    * Space
+    * Cluster size
+
+    At the moment, the spatial extent is fixed to Germany and only a single index is derived.
+    """
     with client_factory(
         **scale_kwargs[scale],
         env={