Scale offset from item asset #202

Merged Jul 23, 2023 — 9 commits. Changes shown from 4 commits.
pyproject.toml — 2 changes: 1 addition & 1 deletion

```diff
@@ -15,7 +15,7 @@ license = {text = "MIT"}
 name = "stackstac"
 readme = "README.md"
 requires-python = ">=3.8,<4.0"
-version = "0.4.3"
+version = "0.4.4"
```
Owner:

Suggested change:

```diff
-version = "0.4.4"
+version = "0.4.3"
```

I'd prefer to do the version bump as a separate PR, like #176 for example.

Contributor Author:

Sounds good.


[project.urls]
homepage = "https://stackstac.readthedocs.io/en/latest/index.html"
stackstac/prepare.py — 13 changes: 11 additions & 2 deletions
```diff
@@ -26,7 +26,7 @@
 from .stac_types import ItemSequence
 from . import accumulate_metadata, geom_utils

-ASSET_TABLE_DT = np.dtype([("url", object), ("bounds", "float64", 4)])
+ASSET_TABLE_DT = np.dtype([("url", object), ("bounds", "float64", 4), ("scale_offset", "float64", 2)])
```
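The widened table dtype can be exercised in isolation. A minimal sketch of how it behaves — the URL and the scale/offset values below are made up, not from a real catalog:

```python
import numpy as np

# Structured dtype as in the PR: per-asset URL, projected bounds, and a
# (scale, offset) pair. Sample values are hypothetical.
ASSET_TABLE_DT = np.dtype(
    [("url", object), ("bounds", "float64", 4), ("scale_offset", "float64", 2)]
)

# One item x one asset; records are assigned as plain tuples.
table = np.zeros((1, 1), dtype=ASSET_TABLE_DT)
table[0, 0] = ("https://example.com/b04.tif", (0.0, 0.0, 10.0, 10.0), (0.0001, -0.1))

# Each field is read back by name; "scale_offset" is a length-2 float64 array.
scale, offset = table[0, 0]["scale_offset"]
print(scale, offset)  # 0.0001 -0.1
```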


class Mimetype(NamedTuple):

```diff
@@ -143,6 +143,15 @@ def prepare_items(
             asset_bbox = asset.get("proj:bbox", item_bbox)
             asset_shape = asset.get("proj:shape", item_shape)
             asset_transform = asset.get("proj:transform", item_transform)
+            raster_bands = asset.get('raster:bands')
+            if raster_bands is not None:
+                try:
+                    assert len(raster_bands) == 1
+                    asset_scale = raster_bands[0].get('scale', np.nan)
+                    asset_offset = raster_bands[0].get('offset', np.nan)
+                except AssertionError:
+                    raise ValueError(f'raster:bands has more than one element for asset {asset_id}.')
```

gjoseph92 marked this conversation as resolved.
Owner:

Suggested change:

```diff
-            try:
-                assert len(raster_bands) == 1
-                asset_scale = raster_bands[0].get('scale', np.nan)
-                asset_offset = raster_bands[0].get('offset', np.nan)
-            except AssertionError:
-                raise ValueError(f'raster:bands has more than one element for asset {asset_id}.')
+            if len(raster_bands) != 1:
+                raise ValueError(
+                    f"raster:bands has {len(raster_bands)} elements for asset {asset_id!r}. "
+                    "Multi-band rasters are not currently supported.\n"
+                    "If you don't care about this asset, you can skip it by giving a list "
+                    "of asset IDs you *do* want in `assets=`, and leaving this one out."
+                )
+            asset_scale = raster_bands[0].get('scale', np.nan)
+            asset_offset = raster_bands[0].get('offset', np.nan)
```

No need to catch our own AssertionError here; just raise the ValueError when necessary.
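For illustration, the validation style suggested above can be run against a hand-written asset dict following the STAC raster extension. The dict, the `asset_id`, and the values are hypothetical:

```python
import numpy as np

# Hypothetical STAC asset dict using the raster extension.
asset = {
    "href": "https://example.com/b04.tif",
    "raster:bands": [{"scale": 0.0001, "offset": -0.1}],
}
asset_id = "B04"

raster_bands = asset.get("raster:bands")
if raster_bands is not None:
    # Raise directly instead of catching our own AssertionError.
    if len(raster_bands) != 1:
        raise ValueError(
            f"raster:bands has {len(raster_bands)} elements for asset {asset_id!r}."
        )
    # Missing keys fall back to NaN, meaning "not set in STAC metadata".
    asset_scale = raster_bands[0].get("scale", np.nan)
    asset_offset = raster_bands[0].get("offset", np.nan)

print(asset_scale, asset_offset)  # 0.0001 -0.1
```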


```diff
             asset_affine = None

             # Auto-compute CRS
@@ -322,7 +331,7 @@ def prepare_items(
                 continue

             # Phew, we figured out all the spatial stuff! Now actually store the information we care about.
-            asset_table[item_i, asset_i] = (asset["href"], asset_bbox_proj)
+            asset_table[item_i, asset_i] = (asset["href"], asset_bbox_proj, (asset_scale, asset_offset))
             # ^ NOTE: If `asset_bbox_proj` is None, NumPy automatically converts it to NaNs

             # At this point, everything has been set (or there was an error)
```

gjoseph92 marked this conversation as resolved.
stackstac/rio_reader.py — 17 changes: 14 additions & 3 deletions
```diff
@@ -32,7 +32,6 @@ def _curthread():

 # /TODO

-
 # Default GDAL configuration options
 DEFAULT_GDAL_ENV = LayeredEnv(
     always=dict(
@@ -65,6 +64,7 @@ def _curthread():
 # https://github.com/pangeo-data/pangeo-example-notebooks/issues/21#issuecomment-432457955
 # https://gdal.org/drivers/raster/vrt.html#multi-threading-issues
 MULTITHREADED_DRIVER_ALLOWLIST = {"GTiff"}
+INTEGER_DTYPES = ['int', 'uint8', 'int8', 'uint16', 'int16']

 class ThreadsafeRioDataset(Protocol):
```
```diff
@@ -304,6 +304,7 @@ def __init__(
         dtype: np.dtype,
         fill_value: Union[int, float],
         rescale: bool,
+        scale_offset: Tuple[float, float],
         gdal_env: Optional[LayeredEnv] = None,
         errors_as_nodata: Tuple[Exception, ...] = (),
     ) -> None:
@@ -312,6 +313,7 @@ def __init__(
         self.resampling = resampling
         self.dtype = dtype
         self.rescale = rescale
+        self.scale_offset = scale_offset
         self.fill_value = fill_value
         self.gdal_env = gdal_env or DEFAULT_GDAL_ENV
         self.errors_as_nodata = errors_as_nodata
```

Owner:

It feels a little weird to have both `rescale` and `scale_offset`. We should probably just remove `rescale`, and at the same time remove support for rescaling from metadata in the COG. As mentioned in #63 (comment), this doesn't seem to get used often anyway, and it makes things more complex (it's unclear which should take precedence).

Then, for `stack(..., rescale=False)`, we'd just pass a no-op `scale_offset` of (1, 0).

Contributor Author:

I have made the recommended changes; happy to get feedback on whether the way I use DEFAULT_SCALE and DEFAULT_OFFSET across the repo makes sense.

Owner:

Also, the docstring for the `rescale` parameter should be updated after this to mention that the values come from STAC metadata.

Contributor Author:

Updated.

gjoseph92 marked this conversation as resolved.
```diff
@@ -399,14 +401,23 @@ def read(self, window: Window, **kwargs) -> np.ndarray:

             raise RuntimeError(msg) from e

+        if result.dtype != self.dtype:
+            result = result.astype(self.dtype, copy=False)
```

Owner:

Note that this becomes unnecessary after #208, so depending on merge order, it can be removed. (This is actually just a different way of solving #206.)

Contributor Author:

I am happy to remove this and delegate to #208, since it is authored by you. What is your timeline for merging it?

Owner:

I was hoping to hear confirmation from @Berhinj that it solves the problem before merging, since I don't have a reproducer. However, I'm quite confident it'll work, so I'll just merge it now so we can get these both in.

I think I'd slightly prefer that approach to the one here, just because it maybe saves one copy (letting GDAL read the data into an array of the desired output dtype, vs. copying into a new array). There are so many copies internally already, though, that I doubt it matters much.

```diff
         if self.rescale:
-            scale, offset = reader.scale_offset
+            scale, offset = self.scale_offset
+
+            if np.isnan(scale) or np.isnan(offset):
+                scale, offset = reader.scale_offset
```

Owner:

Note that it seems to be valid for only one of scale and offset to be set in raster:bands: https://github.com/stac-extensions/raster#transform-height-measurement-to-water-level.

In that case, it seems like it would still be appropriate to apply the rescaling from STAC metadata?

Contributor Author:

Ah, very interesting! Yes, I agree.

Contributor Author:

I have enabled rescaling to be used even if only scale or offset is present.
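One way to honor a partially specified raster:bands entry, as discussed above, is a per-component fallback: NaN ("unset") maps to the identity rescaling values. This helper is a hypothetical sketch, not the code merged in this PR:

```python
import math
from typing import Tuple

# Sketch (assumption: NaN marks "not set in STAC metadata"): fall back
# per component, so scale -> 1 (no-op) and offset -> 0 (no-op).
def resolve_scale_offset(scale: float, offset: float) -> Tuple[float, float]:
    return (1.0 if math.isnan(scale) else scale,
            0.0 if math.isnan(offset) else offset)

print(resolve_scale_offset(float("nan"), 5.0))  # (1.0, 5.0)
```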

```diff
             if scale != 1:
+                if self.dtype in INTEGER_DTYPES:
+                    raise ValueError(f'Requested asset dtype ({self.dtype}) is not compatible with '
+                                     f'asset scale value dtype ({scale.dtype}).')
                 result *= scale
             if offset != 0:
                 result += offset
```

Owner:

I think the check here would need to be more sophisticated. The goal of this check is to prevent silent information loss, and alert users that they need to either not rescale, or change the output data type to something else that can fit the rescaled values.

But just checking whether the output dtype is integral is too strict. Rescaling in an integer dtype could be perfectly fine if you're scaling by an integer and the resulting values still fit in the new dtype. Rescaling from float to int could even be fine; maybe the values are all integers, but unnecessarily stored in float64 on disk.

Ideally, we'd probably temporarily set NumPy to raise on overflow, just try to do the rescale, and handle the error if it occurs — but np.errstate is probably not threadsafe, and this method needs to be.

Note that right now, the docs for rescale say:

> Note that this could produce floating-point data when the original values are ints, so set dtype accordingly. You will NOT be warned if the cast to dtype is losing information!

which makes me feel that for this first PR, it may be better not to validate at all than to have overly strict validation.

Contributor Author:

Hmm, yes, I see how it is overly strict. I will remove the validation.

```diff
         result = result.astype(self.dtype, copy=False)
         result = np.ma.filled(result, fill_value=self.fill_value)
         return result
```

stackstac/to_dask.py — 2 changes: 2 additions & 0 deletions

```diff
@@ -132,6 +132,7 @@ def asset_table_to_reader_and_window(
         if url:
             asset_bounds: Bbox = asset_entry["bounds"]
             asset_window = windows.from_bounds(*asset_bounds, spec.transform)
+            asset_scale_offset = asset_entry["scale_offset"]

             entry: ReaderTableEntry = (
                 reader(
@@ -141,6 +142,7 @@
                     dtype=dtype,
                     fill_value=fill_value,
                     rescale=rescale,
+                    scale_offset=asset_scale_offset,
                     gdal_env=gdal_env,
                     errors_as_nodata=errors_as_nodata,
                 ),
```