diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index 7cfd56ed..05d2bfcb 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -16,7 +16,7 @@ jobs: runs-on: ubuntu-latest strategy: matrix: - python-version: ['3.7', '3.8', '3.9'] + python-version: ['3.8', '3.9', '3.10'] steps: - uses: actions/checkout@v2 @@ -28,17 +28,16 @@ jobs: - name: Install dependencies run: | python -m pip install --upgrade pip - python -m pip install pre-commit codecov - - - name: Install module - run: python -m pip install .["test"] + python -m pip install -e .["test"] - name: Run pre-commit if: ${{ matrix.python-version == env.LATEST_PY_VERSION }} - run: pre-commit run --all-files + run: | + python -m pip install pre-commit + pre-commit run --all-files - name: Run tests - run: python -m pytest --cov rio_tiler --cov-report xml --cov-report term-missing --benchmark-skip + run: python -m pytest --cov rio_tiler --cov-report xml --cov-report term-missing --benchmark-skip -s -vv - name: Upload Results if: ${{ matrix.python-version == env.LATEST_PY_VERSION }} @@ -73,20 +72,20 @@ jobs: - name: Run Benchmark run: python -m pytest --benchmark-only --benchmark-autosave --benchmark-columns 'min, max, mean, median' --benchmark-sort 'min' --benchmark-json output.json - - name: Store and Compare benchmark result - uses: benchmark-action/github-action-benchmark@v1 - with: - name: rio-tiler Benchmarks - tool: 'pytest' - output-file-path: output.json - alert-threshold: '130%' - comment-on-alert: true - fail-on-alert: true - # GitHub API token to make a commit comment - github-token: ${{ secrets.GITHUB_TOKEN }} - # Make a commit on `gh-pages` only if master - auto-push: ${{ github.ref == 'refs/heads/master' }} - benchmark-data-dir-path: benchmarks + # - name: Store and Compare benchmark result + # uses: benchmark-action/github-action-benchmark@v1 + # with: + # name: rio-tiler Benchmarks + # tool: 'pytest' + # output-file-path: output.json + # alert-threshold: '130%' + # 
comment-on-alert: true + # fail-on-alert: true + # # GitHub API token to make a commit comment + # github-token: ${{ secrets.GITHUB_TOKEN }} + # # Make a commit on `gh-pages` only if master + # auto-push: ${{ github.ref == 'refs/heads/master' }} + # benchmark-data-dir-path: benchmarks publish: needs: [tests] diff --git a/.github/workflows/deploy_mkdocs.yml b/.github/workflows/deploy_mkdocs.yml index 97bdf800..336a99d1 100644 --- a/.github/workflows/deploy_mkdocs.yml +++ b/.github/workflows/deploy_mkdocs.yml @@ -44,8 +44,9 @@ jobs: rio_tiler.expression \ rio_tiler.models \ rio_tiler.io.base \ - rio_tiler.io.cogeo \ + rio_tiler.io.rasterio \ rio_tiler.io.stac \ + rio_tiler.io.xarray \ rio_tiler.mosaic.methods.base \ rio_tiler.mosaic.methods.defaults \ rio_tiler.mosaic.reader \ diff --git a/.gitignore b/.gitignore index 5f96ea0b..87350fa2 100644 --- a/.gitignore +++ b/.gitignore @@ -108,4 +108,4 @@ tests/benchmarks/data/* tests/fixtures/mask* .vscode/settings.json -docs/api* +docs/src/api/* diff --git a/CHANGES.md b/CHANGES.md index e207d274..5615dfdc 100644 --- a/CHANGES.md +++ b/CHANGES.md @@ -1,4 +1,162 @@ +# 4.0.0 (TBD) + +* add python 3.10 support +* add `apply_expression` method in `rio_tiler.models.ImageData` class +* update `rio-tiler.reader.read/part` to avoid using WarpedVRT when no *reprojection* or *nodata override* is needed +* add `rio_tiler.io.rasterio.ImageReader` to work either with Non-geo or Geo images in a Non-geo manner (a.k.a: in the pixel coordinates system) + ```python + with ImageReader("image.jpg") as src: + im = src.part((0, 100, 100, 0)) + + with ImageReader("image.jpg") as src: + im = src.tile(0, 0, src.maxzoom) + print(im.bounds) + + >>> BoundingBox(left=0.0, bottom=256.0, right=256.0, top=0.0) + ``` + +* add `rio_tiler.io.xarray.XarrayReader` to work with `xarray.DataArray` + ```python + import xarray + from rio_tiler.io import XarrayReader + + with xarray.open_dataset( + 
"https://ncsa.osn.xsede.org/Pangeo/pangeo-forge/noaa-coastwatch-geopolar-sst-feedstock/noaa-coastwatch-geopolar-sst.zarr", + engine="zarr", + decode_coords="all" + ) as src: + ds = src["analysed_sst"][:1] + ds.rio.write_crs("epsg:4326", inplace=True) + + with XarrayReader(ds) as dst: + img = dst.tile(1, 1, 2) + ``` + note: `xarray` and `rioxarray` optional dependencies are needed for the reader + +**breaking changes** + +* remove python 3.7 support +* update rasterio requirement to `>=1.3` to allow python 3.10 support +* rename `rio_tiler.io.cogeo` to `rio_tiler.io.rasterio` +* rename `COGReader` to `Reader`. We added `rio_tiler.io.COGReader` alias to `rio_tiler.io.Reader` backwards compatibility + ```python + # before + from rio_tiler.io import COGReader + from rio_tiler.io.cogeo import COGReader + + # now + from rio_tiler.io import Reader + from rio_tiler.io.rasterio import Reader + ``` + +* `rio_tiler.readers.read()`, `rio_tiler.readers.part()`, `rio_tiler.readers.preview()` now return a ImageData object +* remove `minzoom` and `maxzoom` attribute in `rio_tiler.io.SpatialMixin` base class +* remove `minzoom` and `maxzoom` attribute in `rio_tiler.io.Reader` (now defined as properties) +* use `b` prefix for band names in `rio_tiler.models.ImageData` class (and in rio-tiler's readers) + ```python + # before + with COGReader("cog.tif") as cog: + img = cog.read() + print(cog.band_names) + >>> ["1", "2", "3"] + + print(cog.info().band_metadata) + >>> [("1", {}), ("2", {}), ("3", {})] + + print(cog.info().band_descriptions) + >>> [("1", ""), ("2", ""), ("3", "")] + + print(list(cog.statistics())) + >>> ["1", "2", "3"] + + # now + with Reader("cog.tif") as cog: + img = cog.read() + print(img.band_names) + >>> ["b1", "b2", "b3"] + + print(cog.info().band_metadata) + >>> [("b1", {}), ("b2", {}), ("b3", {})] + + print(cog.info().band_descriptions) + >>> [("b1", ""), ("b2", ""), ("b3", "")] + + print(list(cog.statistics())) + >>> ["b1", "b2", "b3"] + + with 
STACReader("stac.json") as stac: + print(stac.tile(701, 102, 8, assets=("green", "red")).band_names) + >>> ["green_b1", "red_b1"] + ``` + +* deprecate `asset_expression` in MultiBaseReader. Use of expression is now possible +* `expression` for MultiBaseReader must be in form of `{asset}_b{index}` + + ```python + # before + with STACReader("stac.json") as stac: + stac.tile(701, 102, 8, expression="green/red") + + # now + with STACReader("stac.json") as stac: + stac.tile(701, 102, 8, expression="green_b1/red_b1") + ``` + +* `rio_tiler.reader.point()` (and all Reader's point methods) now return a **rio_tiler.models.PointData** object + + ```python + # before + with rasterio.open("cog.tif") as src: + v = rio_tiler.reader.point(10.20, -42.0) + print(v) + >>> [0, 0, 0] + + with COGReader("cog.tif") as cog: + print(cog.point(10.20, -42.0)) + >>> [0, 0, 0] + + # now + with rasterio.open("cog.tif") as src: + v = rio_tiler.reader.point(src, (10.20, -42)) + print(v) + >>> PointData( + data=array([3744], dtype=uint16), + mask=array([255], dtype=uint8), + band_names=['b1'], + coordinates=(10.20, -42), + crs=CRS.from_epsg(4326), + assets=['cog.tif'], + metadata={} + ) + + with Reader("cog.tif") as cog: + print(cog.point(10.20, -42.0)) + >>> PointData( + data=array([3744], dtype=uint16), + mask=array([255], dtype=uint8), + band_names=['b1'], + coordinates=(10.20, -42), + crs=CRS.from_epsg(4326), + assets=['cog.tif'], + metadata={} + ) + ``` + +* deleted `rio_tiler.reader.preview` function and updated `rio_tiler.reader.read` to allow width/height/max_size options +* reordered keyword options in all `rio_tiler.reader` functions for consistency +* removed `AlphaBandWarning` warning when automatically excluding alpha band from data +* remove `nodata`, `unscale`, `resampling_method`, `vrt_options` and `post_process` options to `Reader` init method and replaced with `options` + ```python + # before + with COGReader("cog.tif", nodata=1, resampling_method="bilinear") as cog: + data = 
cog.preview() + + # now + with Reader(COGEO, options={"nodata": 1, "resampling_method": "bilinear"}) as cog: + data = cog.preview() + ``` + # 3.1.6 (2022-07-22) * Hide `NotGeoreferencedWarning` warnings in `utils.render` and `utils.resize_array` diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md index 602de440..f2c1e08d 100644 --- a/CONTRIBUTING.md +++ b/CONTRIBUTING.md @@ -56,8 +56,9 @@ pdocs as_markdown \ rio_tiler.expression \ rio_tiler.models \ rio_tiler.io.base \ - rio_tiler.io.cogeo \ + rio_tiler.io.rasterio \ rio_tiler.io.stac \ + rio_tiler.io.xarray \ rio_tiler.mosaic.methods.base \ rio_tiler.mosaic.methods.defaults \ rio_tiler.mosaic.reader \ diff --git a/README.md b/README.md index a86573e9..3d450bdf 100644 --- a/README.md +++ b/README.md @@ -47,16 +47,16 @@ data and metadata from any raster source supported by Rasterio/GDAL. This includes local and remote files via HTTP, AWS S3, Google Cloud Storage, etc. -At the low level, `rio-tiler` is *just* a wrapper around the [rasterio.vrt.WarpedVRT](https://github.com/rasterio/rasterio/blob/5b76d05fb374e64602166d6cd880c38424fad39b/rasterio/vrt.py#L15) class, which can be useful for doing re-projection and/or property overriding (e.g nodata value). +At the low level, `rio-tiler` is *just* a wrapper around the [rasterio](https://github.com/rasterio/rasterio) and [GDAL](https://github.com/osgeo/gdal) libraries. 
## Features - Read any dataset supported by GDAL/Rasterio ```python - from rio_tiler.io import COGReader + from rio_tiler.io import Reader - with COGReader("my.tif") as image: + with Reader("my.tif") as image: print(image.dataset) # rasterio opened dataset img = image.read() # similar to rasterio.open("my.tif").read() but returns a rio_tiler.models.ImageData object ``` @@ -64,9 +64,9 @@ At the low level, `rio-tiler` is *just* a wrapper around the [rasterio.vrt.Warpe - User friendly `tile`, `part`, `feature`, `point` reading methods ```python - from rio_tiler.io import COGReader + from rio_tiler.io import Reader - with COGReader("my.tif") as image: + with Reader("my.tif") as image: img = image.tile(x, y, z) # read mercator tile z-x-y img = image.part(bbox) # read the data intersecting a bounding box img = image.feature(geojson_feature) # read the data intersecting a geojson feature @@ -76,9 +76,9 @@ At the low level, `rio-tiler` is *just* a wrapper around the [rasterio.vrt.Warpe - Enable property assignment (e.g nodata) on data reading ```python - from rio_tiler.io import COGReader + from rio_tiler.io import Reader - with COGReader("my.tif") as image: + with Reader("my.tif") as image: img = image.tile(x, y, z, nodata=-9999) # read mercator tile z-x-y ``` @@ -107,14 +107,46 @@ At the low level, `rio-tiler` is *just* a wrapper around the [rasterio.vrt.Warpe ) ``` +- [Xarray](https://xarray.dev) support **(>=4.0)** + + ```python + import xarray + from rio_tiler.io import XarrayReader + + ds = xarray.open_dataset( + "https://pangeo.blob.core.windows.net/pangeo-public/daymet-rio-tiler/na-wgs84.zarr/", + engine="zarr", + decode_coords="all", + consolidated=True, + ) + da = ds["tmax"] + with XarrayReader(da) as dst: + print(dst.info()) + img = dst.tile(1, 1, 2) + ``` + *Note: The XarrayReader needs optional dependencies to be installed `pip install rio-tiler["xarray"]`.* + +- Non-Geo Image support **(>=4.0)** + + ```python + from rio_tiler.io import ImageReader + + with 
ImageReader("image.jpeg") as src: + im = src.tile(0, 0, src.maxzoom) # read top-left `tile` + im = src.part((0, 100, 100, 0)) # read top-left 100x100 pixels + pt = src.point(0, 0) # read pixel value + ``` + + *Note: `ImageReader` is also compatible with proper geo-referenced raster datasets.* + - [Mosaic](https://cogeotiff.github.io/rio-tiler/mosaic/) (merging or stacking) ```python - from rio_tiler.io import COGReader + from rio_tiler.io import Reader from rio_tiler.mosaic import mosaic_reader def reader(file, x, y, z, **kwargs): - with COGReader(file) as image: + with Reader(file) as image: return image.tile(x, y, z, **kwargs) img, assets = mosaic_reader(["image1.tif", "image2.tif"], reader, x, y, z) @@ -124,11 +156,11 @@ At the low level, `rio-tiler` is *just* a wrapper around the [rasterio.vrt.Warpe ```python import morecantile - from rio_tiler.io import COGReader + from rio_tiler.io import Reader # Use EPSG:4326 (WGS84) grid wgs84_grid = morecantile.tms.get("WorldCRS84Quad") - with COGReader("my.tif", tms=wgs84_grid) as cog: + with Reader("my.tif", tms=wgs84_grid) as cog: img = cog.tile(1, 1, 1) ``` diff --git a/docs/mkdocs.yml b/docs/mkdocs.yml index 0289ac90..a269cc9d 100644 --- a/docs/mkdocs.yml +++ b/docs/mkdocs.yml @@ -51,8 +51,9 @@ nav: - rio_tiler.models: api/rio_tiler/models.md - rio_tiler.io: - rio_tiler.io.base: api/rio_tiler/io/base.md - - rio_tiler.io.cogeo: api/rio_tiler/io/cogeo.md + - rio_tiler.io.rasterio: api/rio_tiler/io/rasterio.md - rio_tiler.io.stac: api/rio_tiler/io/stac.md + - rio_tiler.io.xarray: api/rio_tiler/io/xarray.md - rio_tiler.mosaic: - rio_tiler.mosaic.reader: api/rio_tiler/mosaic/reader.md - rio_tiler.mosaic.methods: @@ -64,6 +65,7 @@ nav: - rio_tiler.utils: api/rio_tiler/utils.md - Migration from v1.0 to v2.0: 'v2_migration.md' - Migration from v2.0 to v3.0: 'v3_migration.md' + - Migration from v3.0 to v4.0: 'v4_migration.md' - Development - Contributing: 'contributing.md' - Release Notes: 'release-notes.md' diff --git 
a/docs/src/advanced/custom_readers.md b/docs/src/advanced/custom_readers.md index b105043d..2507909d 100644 --- a/docs/src/advanced/custom_readers.md +++ b/docs/src/advanced/custom_readers.md @@ -1,7 +1,7 @@ `rio-tiler` provides multiple [abstract base classes](https://docs.python.org/3.7/library/abc.html) from which it derives its -main readers: [`COGReader`](../readers.md#cogreader) and +main readers: [`Reader`](../readers.md#reader) and [`STACReader`](../readers.md#stacreader). You can also use these classes to build custom readers. @@ -16,8 +16,6 @@ Main `rio_tiler.io` Abstract Base Class. - **input**: Input - **tms**: The TileMatrixSet define which default projection and map grid the reader uses. Defaults to WebMercatorQuad. -- **minzoom**: Dataset's minzoom. Not in the `__init__` method. -- **maxzoom**: Dataset's maxzoom. Not in the `__init__` method. - **bounds**: Dataset's bounding box. Not in the `__init__` method. - **crs**: dataset's crs. Not in the `__init__` method. - **geographic_crs**: CRS to use as geographic coordinate system. Defaults to WGS84. Not in the `__init__` method. @@ -45,13 +43,7 @@ Abstract methods, are method that **HAVE TO** be implemented in the child class. - **point**: reads pixel value for a specific point (`List`) - **feature**: reads data for a geojson feature (`rio_tiler.models.ImageData`) -Example: [`COGReader`](../readers.md#cogreader) - -### **AsyncBaseReader** - -Equivalent of `BaseReader` for async-ready readers (e.g [aiocogeo](https://github.com/geospatial-jeff/aiocogeo)). The `AsyncBaseReader` has the same attributes/properties/methods as the `BaseReader`. 
- -see example of reader built using `AsyncBaseReader`: https://github.com/cogeotiff/rio-tiler/blob/832ecbd97f560c2764818bca30ca95ef25408527/tests/test_io_async.py#L49 +Example: [`Reader`](../readers.md#reader) ### **MultiBaseReader** @@ -69,7 +61,7 @@ from typing import Dict, Type import attr from morecantile import TileMatrixSet from rio_tiler.io.base import MultiBaseReader -from rio_tiler.io import COGReader, BaseReader +from rio_tiler.io import Reader, BaseReader from rio_tiler.constants import WEB_MERCATOR_TMS from rio_tiler.models import Info @@ -81,7 +73,7 @@ class AssetFileReader(MultiBaseReader): # because we add another attribute (prefix) we need to # re-specify the other attribute for the class - reader: Type[BaseReader] = attr.ib(default=COGReader) + reader: Type[BaseReader] = attr.ib(default=Reader) reader_options: Dict = attr.ib(factory=dict) tms: TileMatrixSet = attr.ib(default=WEB_MERCATOR_TMS) @@ -111,30 +103,30 @@ class AssetFileReader(MultiBaseReader): # we have a directoty with "scene_b1.tif", "scene_b2.tif" with AssetFileReader(input="my_dir/", prefix="scene_") as cr: print(cr.assets) - >>> ['b1', 'b2'] + >>> ['band1', 'band2'] - info = cr.info(assets=("b1", "b2")) + info = cr.info(assets=("band1", "band2")) # MultiBaseReader returns a Dict assert isinstance(info, dict) print(list(info)) - >>> ['b1', 'b2'] + >>> ['band1', 'band2'] - assert isinstance(info["b1"], Info) - print(info["b1"].json(exclude_none=True)) + assert isinstance(info["band1"], Info) + print(info["band1"].json(exclude_none=True)) >>> { 'bounds': [-11.979244865430259, 24.296321392464325, -10.874546803397614, 25.304623891542263], 'minzoom': 7, 'maxzoom': 9, - 'band_metadata': [('1', {})], - 'band_descriptions': [('1', '')], + 'band_metadata': [('b1', {})], + 'band_descriptions': [('b1', '')], 'dtype': 'uint16', 'nodata_type': 'Nodata', 'colorinterp': ['gray'] } - img = cr.tile(238, 218, 9, assets=("b1", "b2")) + img = cr.tile(238, 218, 9, assets=("band1", "band2")) 
print(img.assets) - >>> ['my_dir/scene_b1.tif', 'my_dir/scene_b2.tif'] + >>> ['my_dir/scene_band1.tif', 'my_dir/scene_band2.tif'] # Each assets have 1 bands, so when combining each img we get a (2, 256, 256) array. print(img.data.shape) @@ -199,24 +191,24 @@ class BandFileReader(MultiBandReader): # we have a directoty with "scene_b1.tif", "scene_b2.tif" with BandFileReader(input="my_dir/", prefix="scene_") as cr: print(cr.bands) - >>> ['b1', 'b2'] + >>> ['band1', 'band2'] - print(cr.info(bands=("b1", "b2")).json(exclude_none=True)) + print(cr.info(bands=("band1", "band2")).json(exclude_none=True)) >>> { 'bounds': [-11.979244865430259, 24.296321392464325, -10.874546803397614, 25.304623891542263], 'minzoom': 7, 'maxzoom': 9, - 'band_metadata': [('b1', {}), ('b2', {})], - 'band_descriptions': [('b1', ''), ('b2', '')], + 'band_metadata': [('band1', {}), ('band2', {})], + 'band_descriptions': [('band1', ''), ('band2', '')], 'dtype': 'uint16', 'nodata_type': 'Nodata', 'colorinterp': ['gray', 'gray'] } - img = cr.tile(238, 218, 9, bands=("b1", "b2")) + img = cr.tile(238, 218, 9, bands=("band1", "band2")) print(img.assets) - >>> ['my_dir/scene_b1.tif', 'my_dir/scene_b2.tif'] + >>> ['my_dir/scene_band1.tif', 'my_dir/scene_band2.tif'] print(img.data.shape) >>> (2, 256, 256) @@ -227,7 +219,7 @@ Note: [`rio-tiler-pds`][rio-tiler-pds] readers are built using the `MultiBandRea [rio-tiler-pds]: https://github.com/cogeotiff/rio-tiler-pds -## Custom COGReader subclass +## Custom Reader subclass The example :point_down: was created as a response to https://github.com/developmentseed/titiler/discussions/235. In short, the user needed a way to keep metadata information from an asset within a STAC item. @@ -239,12 +231,12 @@ But rio-tiler has been designed to be easily customizable. 
import attr from rasterio.io import DatasetReader from rio_tiler.io.stac import fetch, _to_pystac_item -from rio_tiler.io import COGReader +from rio_tiler.io import Reader import pystac @attr.s -class CustomSTACReader(COGReader): - """Custom COG Reader support.""" +class CustomSTACReader(Reader): + """Custom Reader support.""" # This will keep the STAC item info within the instance item: pystac.Item = attr.ib(default=None, init=False) @@ -279,7 +271,7 @@ In this `CustomSTACReader`, we are using a custom path `schema` in form of `{ite 1. Parse the input path to get the STAC url and asset name 2. Fetch and parse the STAC item 3. Construct a new `input` using the asset full url. -4. Fall back to the regular `COGReader` initialization (using `super().__attrs_post_init__()`) +4. Fall back to the regular `Reader` initialization (using `super().__attrs_post_init__()`) ## Simple Reader @@ -298,7 +290,7 @@ from morecantile import TileMatrixSet from rio_tiler.constants import BBox, WEB_MERCATOR_TMS @attr.s -class Reader(BaseReader): +class SimpleReader(BaseReader): input: DatasetReader = attr.ib() @@ -355,6 +347,6 @@ class Reader(BaseReader): ) with rasterio.open("file.tif") as src: - with Reader(src) as cog: + with SimpleReader(src) as cog: img = cog.tile(1, 1, 1) ``` diff --git a/docs/src/advanced/dynamic_tiler.md b/docs/src/advanced/dynamic_tiler.md index 8e6d5d2a..896de250 100644 --- a/docs/src/advanced/dynamic_tiler.md +++ b/docs/src/advanced/dynamic_tiler.md @@ -20,7 +20,7 @@ your own API. 
### Requirements -- `rio-tiler ~= 3.0` +- `rio-tiler ~= 4.0` - `fastapi` - `uvicorn` @@ -49,7 +49,7 @@ from starlette.requests import Request from starlette.responses import Response from rio_tiler.profiles import img_profiles -from rio_tiler.io import COGReader +from rio_tiler.io import Reader app = FastAPI( @@ -75,7 +75,7 @@ def tile( url: str = Query(..., description="Cloud Optimized GeoTIFF URL."), ): """Handle tile requests.""" - with COGReader(url) as cog: + with Reader(url) as cog: img = cog.tile(x, y, z) content = img.render(img_format="PNG", **img_profiles.get("png")) return Response(content, media_type="image/png") @@ -90,7 +90,7 @@ def tilejson( tile_url = request.url_for("tile", {"z": "{z}", "x": "{x}", "y": "{y}"}) tile_url = f"{tile_url}?url={url}" - with COGReader(url) as cog: + with Reader(url) as cog: return { "bounds": cog.geographic_bounds, "minzoom": cog.minzoom, diff --git a/docs/src/advanced/feature.md b/docs/src/advanced/feature.md index 391151e5..98877862 100644 --- a/docs/src/advanced/feature.md +++ b/docs/src/advanced/feature.md @@ -1,12 +1,12 @@ ![](https://user-images.githubusercontent.com/10407788/105767632-3f959e80-5f29-11eb-9331-969f3f53111e.png) -Starting with `rio-tiler` v2, a `.feature()` method exists on `rio-tiler`'s readers (e.g `COGReader`) which enables data reading for GeoJSON defined (polygon or multipolygon) shapes. +Starting with `rio-tiler` v2, a `.feature()` method exists on `rio-tiler`'s readers (e.g `Reader`) which enables data reading for GeoJSON defined (polygon or multipolygon) shapes. 
```python -from rio_tiler.io import COGReader +from rio_tiler.io import Reader from rio_tiler.models import ImageData -with COGReader("my-tif.tif") as cog: +with Reader("my-tif.tif") as cog: # Read data for a given geojson polygon img: ImageData = cog.feature(geojson_feature, max_size=1024) # we limit the max_size to 1024 ``` @@ -15,12 +15,12 @@ Under the hood, the `.feature` method uses `GDALWarpVRT`'s `cutline` option and the `.part()` method. The below process is roughly what `.feature` does for you. ```python -from rio_tiler.io import COGReader +from rio_tiler.io import Reader from rio_tiler.utils import create_cutline from rasterio.features import bounds as featureBounds -# Use COGReader to open and read the dataset -with COGReader("my_tif.tif") as cog: +# Use Reader to open and read the dataset +with Reader("my_tif.tif") as cog: # Create WTT Cutline cutline = create_cutline(cog.dataset, feat, geometry_crs="epsg:4326") @@ -36,8 +36,8 @@ Another interesting fact about the `cutline` option is that it can be used with ```python bbox = featureBounds(feat) -# Use COGReader to open and read the dataset -with COGReader("my_tif.tif") as cog: +# Use Reader to open and read the dataset +with Reader("my_tif.tif") as cog: # Create WTT Cutline cutline = create_cutline(cog.dataset, feat, geometry_crs="epsg:4326") diff --git a/docs/src/advanced/tms.md b/docs/src/advanced/tms.md index 8d4e6b72..0e29d34a 100644 --- a/docs/src/advanced/tms.md +++ b/docs/src/advanced/tms.md @@ -6,12 +6,12 @@ Starting with rio-tiler 2.0, we replaced [`mercantile`][mercantile] with [_`more ```python import morecantile -from rio_tiler.io import COGReader +from rio_tiler.io import Reader from rasterio.crs import CRS from pyproj import CRS as projCRS # By default we use WebMercator TMS -with COGReader("my.tif") as cog: +with Reader("my.tif") as cog: img = cog.tile(1, 1, 1) assert img.crs == CRS.from_epsg(3857) # default image output is the TMS crs (WebMercator) @@ -34,7 +34,7 @@ for name, tms in 
morecantile.tms.tms.items(): # Use EPSG:4326 (WGS84) grid wgs84_grid = morecantile.tms.get("WorldCRS84Quad") -with COGReader("my.tif", tms=wgs84_grid) as cog: +with Reader("my.tif", tms=wgs84_grid) as cog: img = cog.tile(1, 1, 1) assert img.crs == CRS.from_epsg(4326) @@ -43,7 +43,7 @@ extent = [-948.75, -543592.47, 5817.41, -3333128.95] # From https:///epsg.io/30 epsg3031TMS = morecantile.TileMatrixSet.custom( extent, projCRS.from_epsg(3031), identifier="MyCustomTmsEPSG3031" ) -with COGReader("my.tif", tms=epsg3031TMS) as cog: +with Reader("my.tif", tms=epsg3031TMS) as cog: img = cog.tile(1, 1, 1) assert img.crs == CRS.from_epsg(3031) ``` diff --git a/docs/src/advanced/zonal_stats.md b/docs/src/advanced/zonal_stats.md index 2ff5e911..39e33eb4 100644 --- a/docs/src/advanced/zonal_stats.md +++ b/docs/src/advanced/zonal_stats.md @@ -12,8 +12,8 @@ from rio_tiler.models import BandStatistics from geojson_pydantic.features import Feature, FeatureCollection from geojson_pydantic.geometries import Polygon -class COGReader(io.COGReader): - """Custom COGReader with zonal_statistics method.""" +class Reader(io.Reader): + """Custom Reader with zonal_statistics method.""" def zonal_statistics( self, @@ -49,7 +49,7 @@ class COGReader(io.COGReader): geojson = FeatureCollection(features=[geojson]) for feature in geojson: - # Get data overlapping with the feature (using COGReader.feature method) + # Get data overlapping with the feature (using Reader.feature method) data = self.feature( feature.dict(exclude_none=True), max_size=max_size, diff --git a/docs/src/colormap.md b/docs/src/colormap.md index 9799c63b..ffaf69e0 100644 --- a/docs/src/colormap.md +++ b/docs/src/colormap.md @@ -8,26 +8,25 @@ to `rio_tiler.utils.render`: ```python from rio_tiler.colormap import cmap -from rio_tiler.io import COGReader +from rio_tiler.io import Reader # Get Colormap # You can list available colormap names with `cmap.list()` cm = cmap.get("cfastie") -with COGReader( - 
"s3://landsat-pds/c1/L8/015/029/LC08_L1GT_015029_20200119_20200119_01_RT/LC08_L1GT_015029_20200119_20200119_01_RT_B8.TIF", - nodata=0, -) as cog: - img = cog.tile(150, 187, 9) +with Reader( + "https://sentinel-cogs.s3.amazonaws.com/sentinel-s2-l2a-cogs/29/R/KH/2020/2/S2A_29RKH_20200219_0_L2A/B01.tif", +) as src: + img = src.tile(239, 220, 9) # Rescale the data linearly from 0-10000 to 0-255 - image_rescale = img.post_process( + img.rescale( in_range=((0, 10000),), out_range=((0, 255),) ) # Apply colormap and create a PNG buffer - buff = image_rescale.render(colormap=cm) # this returns a buffer (PNG by default) + buff = img.render(colormap=cm) # this returns a buffer (PNG by default) ``` The `render` method accept colormap in form of: diff --git a/docs/src/examples/Using-nonEarth-dataset.ipynb b/docs/src/examples/Using-nonEarth-dataset.ipynb index 070abace..48e287cf 100644 --- a/docs/src/examples/Using-nonEarth-dataset.ipynb +++ b/docs/src/examples/Using-nonEarth-dataset.ipynb @@ -21,7 +21,7 @@ "# Requirements\n", "\n", "To be able to run this notebook you'll need the following requirements:\n", - "- rio-tiler~= 3.0\n", + "- rio-tiler~=4.0\n", "- ipyleaflet\n", "- matplotlib" ] @@ -44,14 +44,14 @@ "outputs": [], "source": [ "%pylab inline\n", - "from rio_tiler.io import COGReader\n", + "from rio_tiler.io import Reader\n", "\n", "# In order to fully work, we'll need to build a custom TileMatrixSet\n", "from morecantile import TileMatrixSet\n", "from pyproj import CRS\n", "\n", "# For this DEMO we will use this file\n", - "src_path = \"https://asc-jupiter.s3-us-west-2.amazonaws.com/europa/galileo_voyager/controlled_mosaics/11ESCOLORS01-02_GalileoSSI_Equi-cog.tif\"" + "src_path = \"https://raw.githubusercontent.com/cogeotiff/rio-tiler/master/tests/fixtures/cog_nonearth.tif\"" ] }, { @@ -60,12 +60,12 @@ "metadata": {}, "outputs": [], "source": [ - "\n", "# Let's first try with default\n", - "# We should see 2 different warnings here\n", - "# - UserWarning: Cannot 
dertermine min/max zoom based on dataset informations: We cannot get default Zooms in WebMercator projection\n", + "# We should see 3 different warnings here\n", "# - UserWarning: Cannot dertermine bounds in WGS84: There is no existing transformation to WGS84\n", - "with COGReader(src_path) as cog:\n", + "# - UserWarning: Cannot dertermine minzoom based on dataset informations: We cannot get default Zooms in WebMercator projection\n", + "# - UserWarning: Cannot dertermine maxzoom based on dataset informations: We cannot get default Zooms in WebMercator projection\n", + "with Reader(src_path) as cog:\n", " print(cog.info().json())" ] }, @@ -75,7 +75,6 @@ "metadata": {}, "outputs": [], "source": [ - "\n", "# Create a CUSTOM TMS using the europa ESRI:104915 projection\n", "europa_crs = CRS.from_authority(\"ESRI\", 104915)\n", "europa_tms = TileMatrixSet.custom(\n", @@ -85,8 +84,8 @@ "# Use Custom TMS instead of Web Mercator\n", "# We should see 2 different warnings here\n", "# - UserWarning: Could not create coordinate Transformer from input CRS to WGS84: This is from morecantile. It means some methods won't be available but we can ignore. \n", - "# - UserWarning: Cannot dertermine bounds in WGS84: Same as before. the `cog.geographic` property will return default (-180.0, -90.0, 180.0, 90.0)\n", - "with COGReader(src_path, tms=europa_tms) as cog:\n", + "# - UserWarning: Cannot dertermine bounds in WGS84: Same as before. 
the `cog.geographic_bounds` property will return default (-180.0, -90.0, 180.0, 90.0)\n", + "with Reader(src_path, tms=europa_tms) as cog:\n", " print(cog.info().json())\n", " img = cog.preview()\n", " imshow(img.data_as_image())" @@ -95,20 +94,22 @@ { "cell_type": "code", "execution_count": null, - "metadata": {}, + "metadata": { + "scrolled": false + }, "outputs": [], "source": [ "# Read a Tile\n", "from rasterio.warp import transform_bounds\n", "\n", - "with COGReader(src_path, tms=europa_tms) as cog:\n", + "with Reader(src_path, tms=europa_tms) as cog:\n", " # get dataset bounds in TMS's CRS projection\n", " bounds_in_tms = transform_bounds(cog.crs, europa_tms.rasterio_crs, *cog.bounds)\n", " tile = cog.tms._tile(bounds_in_tms[0], bounds_in_tms[1], cog.minzoom)\n", " print(tile)\n", "\n", " img = cog.tile(tile.x, tile.y, tile.z)\n", - " imshow(img.data_as_image())\n" + " imshow(img.data_as_image())" ] }, { @@ -150,7 +151,7 @@ "from tornado.httpserver import HTTPServer\n", "from tornado.concurrent import run_on_executor\n", "\n", - "from rio_tiler.io import COGReader\n", + "from rio_tiler.io import Reader\n", "from rio_tiler.errors import TileOutsideBounds\n", "from rio_tiler.profiles import img_profiles\n", "\n", @@ -195,7 +196,7 @@ " def _get_tile(self, z, x, y):\n", "\n", " try:\n", - " with COGReader(self.url, tms=europa_tms) as cog:\n", + " with Reader(self.url, tms=europa_tms) as cog:\n", " data = cog.tile(x, y, z)\n", " except TileOutsideBounds:\n", " raise web.HTTPError(404)\n", @@ -267,7 +268,7 @@ ], "metadata": { "kernelspec": { - "display_name": "Python 3", + "display_name": "Python 3 (ipykernel)", "language": "python", "name": "python3" }, @@ -281,7 +282,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.8.2" + "version": "3.9.13" } }, "nbformat": 4, diff --git a/docs/src/examples/Using-rio-tiler-STACReader.ipynb b/docs/src/examples/Using-rio-tiler-STACReader.ipynb index 43169315..6354400e 100644 --- 
a/docs/src/examples/Using-rio-tiler-STACReader.ipynb +++ b/docs/src/examples/Using-rio-tiler-STACReader.ipynb @@ -53,7 +53,7 @@ "source": [ "from rio_tiler.io import STACReader\n", "from rio_tiler.profiles import img_profiles\n", - "from rio_tiler.models import ImageData, Metadata" + "from rio_tiler.models import ImageData" ] }, { @@ -191,10 +191,10 @@ "source": [ "fig, axs = plt.subplots(1, 4, sharey=True, tight_layout=True, dpi=150)\n", "\n", - "axs[0].plot(meta[\"B01\"][\"1\"].histogram[1][0:-1], meta[\"B01\"][\"1\"].histogram[0])\n", - "axs[1].plot(meta[\"B02\"][\"1\"].histogram[1][0:-1], meta[\"B02\"][\"1\"].histogram[0])\n", - "axs[2].plot(meta[\"B03\"][\"1\"].histogram[1][0:-1], meta[\"B03\"][\"1\"].histogram[0])\n", - "axs[3].plot(meta[\"B04\"][\"1\"].histogram[1][0:-1], meta[\"B04\"][\"1\"].histogram[0])" + "axs[0].plot(meta[\"B01\"][\"b1\"].histogram[1][0:-1], meta[\"B01\"][\"b1\"].histogram[0])\n", + "axs[1].plot(meta[\"B02\"][\"b1\"].histogram[1][0:-1], meta[\"B02\"][\"b1\"].histogram[0])\n", + "axs[2].plot(meta[\"B03\"][\"b1\"].histogram[1][0:-1], meta[\"B03\"][\"b1\"].histogram[0])\n", + "axs[3].plot(meta[\"B04\"][\"b1\"].histogram[1][0:-1], meta[\"B04\"][\"b1\"].histogram[0])" ] }, { @@ -256,11 +256,12 @@ "outputs": [], "source": [ "# The sentinel data is stored as UInt16, we need to do some data rescaling to display data from 0 to 255\n", - "print(img.data.min(), img.data.max())\n", + "print(img.data.min(), img.data.max())\n", + "\n", + "img.rescale(in_range=((0, 10000),))\n", + "print(img.min(), img.max())\n", "\n", - "image = img.post_process(in_range=((0, 10000),))\n", - "image = image.data_as_image()\n", - "print(image.min(), image.max())\n", + "image = img.data_as_image()\n", "imshow(image)" ] }, @@ -279,14 +280,16 @@ "source": [ "with STACReader(src_path) as stac:\n", " # By default `preview()` will return an array with its longest dimension lower or equal to 1024px\n", - " img = stac.preview(expression=\"(B08-B04)/(B08+B04)\", 
max_size=256)\n", + " img = stac.preview(expression=\"(B08_b1-B04_b1)/(B08_b1+B04_b1)\", max_size=256)\n", " print(img.data.shape)\n", " # learn more about the ImageData model https://cogeotiff.github.io/rio-tiler/models/#imagedata\n", " assert isinstance(img, ImageData)\n", "\n", "# NDVI data range should be between -1 and 1\n", - "image = img.post_process(in_range=((-1,1),))\n", - "image = image.data_as_image()\n", + "print(img.data.min(), img.data.max())\n", + "\n", + "img.rescale(in_range=((-1,1),))\n", + "image = img.data_as_image()\n", "imshow(image)" ] }, @@ -303,7 +306,8 @@ "hash": "e5a596c8625da0593f23bdd5ea51ce5c4572779fa5edc69fb6a18fc94feb7fb6" }, "kernelspec": { - "display_name": "Python 3.8.2 64-bit", + "display_name": "Python 3 (ipykernel)", + "language": "python", "name": "python3" }, "language_info": { @@ -316,7 +320,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.8.2" + "version": "3.9.13" } }, "nbformat": 4, diff --git a/docs/src/examples/Using-rio-tiler-XarrayReader.ipynb b/docs/src/examples/Using-rio-tiler-XarrayReader.ipynb new file mode 100644 index 00000000..0eb3085c --- /dev/null +++ b/docs/src/examples/Using-rio-tiler-XarrayReader.ipynb @@ -0,0 +1,972 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "id": "45bf509c", + "metadata": {}, + "outputs": [], + "source": [ + "import xarray\n", + "import matplotlib.pyplot as plt\n", + "\n", + "from rio_tiler.io.xarray import XarrayReader" + ] + }, + { + "cell_type": "markdown", + "id": "d2c1f9bd", + "metadata": {}, + "source": [ + "### daymet" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "feb70fe3", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "
<xarray.Dataset>\n",
+       "Dimensions:                  (time: 1, y: 3728, x: 17268)\n",
+       "Coordinates:\n",
+       "    lambert_conformal_conic  int64 0\n",
+       "  * time                     (time) datetime64[ns] 1980-07-01T12:00:00\n",
+       "  * x                        (x) float64 -180.0 -180.0 -179.9 ... 180.0 180.0\n",
+       "  * y                        (y) float64 83.78 83.76 83.74 ... 6.126 6.105 6.084\n",
+       "Data variables:\n",
+       "    tmax                     (time, y, x) float32 ...\n",
+       "Attributes:\n",
+       "    Conventions:       CF-1.6\n",
+       "    Version_data:      Daymet Data Version 4.0\n",
+       "    Version_software:  Daymet Software Version 4.0\n",
+       "    citation:          Please see http://daymet.ornl.gov/ for current Daymet ...\n",
+       "    references:        Please see http://daymet.ornl.gov/ for current informa...\n",
+       "    source:            Daymet Software Version 4.0\n",
+       "    start_year:        1980
" + ], + "text/plain": [ + "\n", + "Dimensions: (time: 1, y: 3728, x: 17268)\n", + "Coordinates:\n", + " lambert_conformal_conic int64 ...\n", + " * time (time) datetime64[ns] 1980-07-01T12:00:00\n", + " * x (x) float64 -180.0 -180.0 -179.9 ... 180.0 180.0\n", + " * y (y) float64 83.78 83.76 83.74 ... 6.126 6.105 6.084\n", + "Data variables:\n", + " tmax (time, y, x) float32 ...\n", + "Attributes:\n", + " Conventions: CF-1.6\n", + " Version_data: Daymet Data Version 4.0\n", + " Version_software: Daymet Software Version 4.0\n", + " citation: Please see http://daymet.ornl.gov/ for current Daymet ...\n", + " references: Please see http://daymet.ornl.gov/ for current informa...\n", + " source: Daymet Software Version 4.0\n", + " start_year: 1980" + ] + }, + "execution_count": 2, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "ds = xarray.open_dataset(\n", + " \"https://pangeo.blob.core.windows.net/pangeo-public/daymet-rio-tiler/na-wgs84.zarr/\",\n", + " engine=\"zarr\",\n", + " decode_coords=\"all\",\n", + " consolidated=True,\n", + ")\n", + "ds" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "cafd96de", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "
<xarray.DataArray 'tmax' (time: 1, y: 3728, x: 17268)>\n",
+       "[64375104 values with dtype=float32]\n",
+       "Coordinates:\n",
+       "    lambert_conformal_conic  int64 0\n",
+       "  * time                     (time) datetime64[ns] 1980-07-01T12:00:00\n",
+       "  * x                        (x) float64 -180.0 -180.0 -179.9 ... 180.0 180.0\n",
+       "  * y                        (y) float64 83.78 83.76 83.74 ... 6.126 6.105 6.084\n",
+       "Attributes:\n",
+       "    cell_methods:  area: mean time: maximum within days time: mean over days\n",
+       "    coordinates:   lon lat\n",
+       "    long_name:     annual average of daily maximum temperature\n",
+       "    units:         degrees C
" + ], + "text/plain": [ + "\n", + "[64375104 values with dtype=float32]\n", + "Coordinates:\n", + " lambert_conformal_conic int64 0\n", + " * time (time) datetime64[ns] 1980-07-01T12:00:00\n", + " * x (x) float64 -180.0 -180.0 -179.9 ... 180.0 180.0\n", + " * y (y) float64 83.78 83.76 83.74 ... 6.126 6.105 6.084\n", + "Attributes:\n", + " cell_methods: area: mean time: maximum within days time: mean over days\n", + " coordinates: lon lat\n", + " long_name: annual average of daily maximum temperature\n", + " units: degrees C" + ] + }, + "execution_count": 3, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "da = ds[\"tmax\"]\n", + "da" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "d29e0c33", + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "bounds=BoundingBox(left=-179.99998449579846, bottom=6.073484821356791, right=179.98170598363066, top=83.79467217916716) minzoom=1 maxzoom=6 band_metadata=[('b1', {'long_name': '24-hour day based on local time', 'standard_name': 'time'})] band_descriptions=[('b1', '1980-07-01T12:00:00.000000000')] dtype='float32' nodata_type='Nodata' colorinterp=None scale=None offset=None colormap=None attrs={'cell_methods': 'area: mean time: maximum within days time: mean over days', 'coordinates': 'lon lat', 'long_name': 'annual average of daily maximum temperature', 'units': 'degrees C'} height=3728 count=1 name='tmax' width=17268\n" + ] + } + ], + "source": [ + "da = ds[\"tmax\"]\n", + "with XarrayReader(da) as dst:\n", + " print(dst.info())" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "93d11d9c", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "with XarrayReader(da) as dst:\n", + " img = dst.tile(1, 1, 2)\n", + "\n", + "plt.imshow(img.data_as_image());" + ] + }, + { + "cell_type": "markdown", + "id": "1c538213", + "metadata": {}, + "source": [ + "### noaa-coastwatch-geopolar-sst" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "8f90e288", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "bounds=BoundingBox(left=-180.00000610436345, bottom=-89.99999847369712, right=180.00000610436345, top=89.99999847369712) minzoom=0 maxzoom=2 band_metadata=[('b1', {'axis': 'T', 'comment': 'Nominal time of Level 4 analysis', 'long_name': 'reference time of sst field', 'standard_name': 'time'})] band_descriptions=[('b1', '2002-09-01T12:00:00.000000000')] dtype='float32' nodata_type='Nodata' colorinterp=None scale=None offset=None colormap=None attrs={'comment': 'Analysed SST for each ocean grid point', 'long_name': 'analysed sea surface temperature', 'reference': 'Fieguth,P.W. et al. \"Mapping Mediterranean altimeter data with a multiresolution optimal interpolation algorithm\", J. Atmos. Ocean Tech, 15 (2): 535-546, 1998. Fieguth, P. Multiply-Rooted Multiscale Models for Large-Scale Estimation, IEEE Image Processing, 10(11), 1676-1686, 2001. Khellah, F., P.W. Fieguth, M.J. Murray and M.R. Allen, \"Statistical Processing of Large Image Sequences\", IEEE Transactions on Geoscience and Remote Sensing, 12 (1), 80-93, 2005. Maturi, E., A. Harris, J. Mittaz, J. Sapper, G. Wick, X. Zhu, P. Dash, P. 
Koner, \"A New High-Resolution Sea Surface Temperature Blended Analysis\", Bulleting of the American Meteorological Society, 98 (5), 1015-1026, 2017.', 'source': 'STAR-ACSPO_GAC, STAR-ACSPO_H-8, STAR-Geo_SST, UKMO-OSTIA', 'standard_name': 'sea_surface_foundation_temperature', 'units': 'kelvin', 'valid_max': 4000, 'valid_min': -200} height=3600 count=1 name='analysed_sst' width=7200\n" + ] + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "with xarray.open_dataset(\n", + " \"https://ncsa.osn.xsede.org/Pangeo/pangeo-forge/noaa-coastwatch-geopolar-sst-feedstock/noaa-coastwatch-geopolar-sst.zarr\",\n", + " engine=\"zarr\",\n", + " decode_coords=\"all\"\n", + ") as src:\n", + " \n", + " ds = src[\"analysed_sst\"][:1]\n", + " \n", + " # the SST dataset does not have CRS info\n", + " # so we need to add it `virtually` within the Xarray DataArray\n", + " ds.rio.write_crs(\"epsg:4326\", inplace=True)\n", + " \n", + " with XarrayReader(ds) as dst:\n", + " print(dst.info())\n", + " img = dst.tile(1, 1, 2)\n", + "\n", + " plt.imshow(img.data_as_image())" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "b4c3f03f", + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "py39", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.13" + }, + "vscode": { + "interpreter": { + "hash": "2590a9e34ee6c8bdce5141410f2a072bbabd2a859a8a48acdaa85720923a90ef" + } + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/docs/src/examples/Using-rio-tiler-mosaic.ipynb b/docs/src/examples/Using-rio-tiler-mosaic.ipynb index 00732e40..ce25ebe0 100755 --- a/docs/src/examples/Using-rio-tiler-mosaic.ipynb +++ b/docs/src/examples/Using-rio-tiler-mosaic.ipynb @@ -35,12 +35,12 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "# Requirements\n", + "#### Requirements\n", "\n", "To be able to run this notebook you'll need the following requirements:\n", "- rasterio\n", "- ipyleaflet\n", - "- rio-tiler~= 3.0" + "- rio-tiler~= 4.0" ] }, { @@ -65,7 +65,7 @@ "\n", "import morecantile\n", "\n", - "from rio_tiler.io import 
COGReader, STACReader\n", + "from rio_tiler.io import Reader, STACReader\n", "from rio_tiler.mosaic import mosaic_reader\n", "from rio_tiler.mosaic.methods import defaults\n", "from rio_tiler.mosaic.methods.base import MosaicMethodBase\n", @@ -269,7 +269,7 @@ "outputs": [], "source": [ "def tiler(asset, *args, **kwargs):\n", - " with COGReader(asset) as cog:\n", + " with Reader(asset) as cog:\n", " return cog.tile(*args, **kwargs)" ] }, @@ -423,7 +423,7 @@ "# Because we need to use multiple STAC assets, it's easier to use the STACReader\n", "def custom_tiler(asset, *args, **kwargs):\n", " with STACReader(asset) as stac:\n", - " return stac.tile(*args, expression=\"(B08-B04)/(B08+B04)\")\n", + " return stac.tile(*args, expression=\"(B08_b1-B04_b1)/(B08_b1+B04_b1)\")\n", "\n", "tile = tiles[0]\n", "\n", @@ -465,7 +465,7 @@ "def custom_tiler(asset, *args, **kwargs):\n", " with STACReader(asset) as stac:\n", " img = stac.tile(*args, assets=\"visual\")\n", - " ndvi = stac.tile(*args, expression=\"(B08-B04)/(B08+B04)\")\n", + " ndvi = stac.tile(*args, expression=\"(B08_b1-B04_b1)/(B08_b1+B04_b1)\")\n", " return ImageData(numpy.concatenate((img.data, ndvi.data)), img.mask, crs=img.crs, bounds=img.bounds)" ] }, @@ -552,7 +552,7 @@ ], "metadata": { "kernelspec": { - "display_name": "Python 3", + "display_name": "Python 3 (ipykernel)", "language": "python", "name": "python3" }, @@ -566,7 +566,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.8.2" + "version": "3.9.13" } }, "nbformat": 4, diff --git a/docs/src/examples/Using-rio-tiler.ipynb b/docs/src/examples/Using-rio-tiler.ipynb index 472f8bcd..d7cfd44f 100644 --- a/docs/src/examples/Using-rio-tiler.ipynb +++ b/docs/src/examples/Using-rio-tiler.ipynb @@ -33,7 +33,7 @@ "# Requirements\n", "\n", "To be able to run this notebook you'll need the following requirements:\n", - "- rio-tiler~= 3.0" + "- rio-tiler~= 4.0" ] }, { @@ -52,7 +52,7 @@ "outputs": [], "source": [ "import 
morecantile\n", - "from rio_tiler.io import COGReader\n", + "from rio_tiler.io import Reader\n", "from rio_tiler.profiles import img_profiles\n", "from rio_tiler.models import ImageData" ] @@ -61,14 +61,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "## Data\n", - "\n", - "For this demo we will use some NAIP data hosted on Azure.\n", - "\n", - "https://azure.microsoft.com/fr-fr/services/open-datasets/catalog/naip/\n", - "\n", - "\n", - "The data is similar to the data hosted on [AWS](https://registry.opendata.aws/naip/), but using the one on Azure is easier because it offers direct `http` access without needing an AWS account." + "\n" ] }, { @@ -78,7 +71,7 @@ "outputs": [], "source": [ "# For this DEMO we will use this file\n", - "src_path = \"https://naipblobs.blob.core.windows.net/naip/v002/al/2019/al_60cm_2019/30087/m_3008701_ne_16_060_20191115.tif\"" + "src_path = \"https://data.geo.admin.ch/ch.swisstopo.swissalti3d/swissalti3d_2019_2573-1085/swissalti3d_2019_2573-1085_0.5_2056_5728.tif\"" ] }, { @@ -87,7 +80,7 @@ "source": [ "## rio_tiler.io.COGReader\n", "\n", - "In `rio-tiler` 2.0 we introduced COGReader, which is a python class providing usefull methods to read and inspect any GDAL/rasterio raster dataset.\n", + "In `rio-tiler` 2.0 we introduced COGReader (renamed Reader in 4.0), which is a python class providing useful methods to read and inspect any GDAL/rasterio raster dataset.\n", "\n", "Docs: [https://cogeotiff.github.io/rio-tiler/readers/#cogreader](https://cogeotiff.github.io/rio-tiler/readers/#cogreader) " ] @@ -98,7 +91,7 @@ "metadata": {}, "outputs": [], "source": [ - "?COGReader" + "?Reader" ] }, { @@ -120,7 +113,7 @@ "source": [ "# As for Rasterio, using context manager is a good way to \n", "# make sure the dataset are closed when we exit.\n", - "with COGReader(src_path) as cog:\n", + "with Reader(src_path) as cog:\n", " print(\"rasterio dataset:\")\n", " print(cog.dataset)\n", " print()\n", @@ -152,12 +145,12 @@ }, "outputs": [], 
"source": [ - "with COGReader(src_path) as cog:\n", + "with Reader(src_path) as cog:\n", " meta = cog.statistics(max_size=256)\n", "\n", " assert isinstance(meta, dict)\n", " print(list(meta))\n", - " print(meta[\"1\"].dict())" + " print(meta[\"b1\"].dict())" ] }, { @@ -173,18 +166,8 @@ "metadata": {}, "outputs": [], "source": [ - "fig, axs = plt.subplots(1, 4, sharey=True, tight_layout=True, dpi=150)\n", - "# Red (index 1)\n", - "axs[0].plot(meta[\"1\"].histogram[1][0:-1], meta[\"1\"].histogram[0])\n", - "\n", - "# Green (index 2)\n", - "axs[1].plot(meta[\"2\"].histogram[1][0:-1], meta[\"2\"].histogram[0])\n", - "\n", - "# Blue (index 3)\n", - "axs[2].plot(meta[\"3\"].histogram[1][0:-1], meta[\"3\"].histogram[0])\n", - "\n", - "# NIR (index 4)\n", - "axs[3].plot(meta[\"4\"].histogram[1][0:-1], meta[\"4\"].histogram[0])" + "# Band 1\n", + "plot(meta[\"b1\"].histogram[1][0:-1], meta[\"b1\"].histogram[0])" ] }, { @@ -202,7 +185,7 @@ "metadata": {}, "outputs": [], "source": [ - "with COGReader(src_path) as cog:\n", + "with Reader(src_path) as cog:\n", " # By default `preview()` will return an array with its longest dimension lower or equal to 1024px\n", " data = cog.preview()\n", " print(data.data.shape)\n", @@ -228,14 +211,17 @@ }, "outputs": [], "source": [ - "print(f\"width: {img.width}\")\n", - "print(f\"height: {img.height}\")\n", - "print(f\"bands: {img.count}\")\n", - "print(f\"crs: {img.crs}\")\n", - "print(f\"bounds: {img.bounds}\")\n", + "print(f\"width: {data.width}\")\n", + "print(f\"height: {data.height}\")\n", + "print(f\"bands: {data.count}\")\n", + "print(f\"crs: {data.crs}\")\n", + "print(f\"bounds: {data.bounds}\")\n", + "print(f\"metadata: {data.metadata}\")\n", + "print(f\"assets: {data.assets}\")\n", + "print(f\"dataset stats: {data.dataset_statistics}\") # If stored in the original dataset\n", "\n", - "print(type(img.data))\n", - "print(type(img.mask))" + "print(type(data.data))\n", + "print(type(data.mask))" ] }, { @@ -248,22 +234,54 @@ { 
"cell_type": "code", "execution_count": null, - "metadata": {}, + "metadata": { + "scrolled": false + }, "outputs": [], "source": [ "# Rasterio doesn't use the same axis order than visualization libraries (e.g matplotlib, PIL)\n", "# in order to display the data we need to change the order (using rasterio.plot.array_to_image).\n", "# the ImageData class wraps the rasterio function in the `data_as_image()` method.\n", - "print(type(img))\n", - "print(img.data.shape)\n", + "print(type(data))\n", + "print(data.data.shape)\n", "\n", - "image = img.data_as_image()\n", + "image = data.data_as_image()\n", "# data_as_image() returns a numpy.ndarray\n", "print(type(image))\n", "print(image.shape)\n", "\n", - "# Use only the first 3 bands (RGB)\n", - "imshow(image[:,:,0:3])" + "imshow(image)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Multi Spectral Data\n", + "\n", + "For this demo we will use some High resolution RGB-Nir data hosted on [AWS](https://registry.opendata.aws/nj-imagery/).\n", + "\n" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "src_path = \"https://njogis-imagery.s3.amazonaws.com/2020/cog/I7D16.tif\"" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "with Reader(src_path) as cog:\n", + " info = cog.info()\n", + " print(\"rio-tiler dataset info:\")\n", + " print(cog.info().dict(exclude_none=True))" ] }, { @@ -272,9 +290,23 @@ "metadata": {}, "outputs": [], "source": [ - "# Display NRG image\n", - "# The NAIP imagery has 4 bands Red, Green, Blue, NIR\n", - "imshow(image[:,:,[3,0,1]])" + "with Reader(src_path) as cog:\n", + " meta = cog.statistics()\n", + "\n", + "print(list(meta))\n", + " \n", + "fig, axs = plt.subplots(1, 4, sharey=True, tight_layout=True, dpi=150)\n", + "# Red (index 1)\n", + "axs[0].plot(meta[\"b1\"].histogram[1][0:-1], meta[\"b1\"].histogram[0])\n", + "\n", + "# Green (index 
2)\n", + "axs[1].plot(meta[\"b2\"].histogram[1][0:-1], meta[\"b2\"].histogram[0])\n", + "\n", + "# Blue (index 3)\n", + "axs[2].plot(meta[\"b3\"].histogram[1][0:-1], meta[\"b3\"].histogram[0])\n", + "\n", + "# Nir (index 4)\n", + "axs[3].plot(meta[\"b4\"].histogram[1][0:-1], meta[\"b4\"].histogram[0])" ] }, { @@ -292,11 +324,13 @@ "metadata": {}, "outputs": [], "source": [ - "with COGReader(src_path) as cog:\n", - " # Return only the last band\n", + "with Reader(src_path) as cog:\n", + " # Return only the fourth (NIR) band\n", " nir_band = cog.preview(indexes=4)\n", " print(nir_band.data.shape)\n", - " print(nir_band.data.dtype)" + " print(nir_band.data.dtype)\n", + "\n", + "imshow(nir_band.data_as_image())" ] }, { @@ -305,7 +339,23 @@ "metadata": {}, "outputs": [], "source": [ - "with COGReader(src_path) as cog:\n", + "with Reader(src_path) as cog:\n", + " # Return the NIR, Red and Green bands (NRG false-color composite)\n", + " nrg = cog.preview(indexes=(4,1,2))\n", + " \n", + " # Data is in Uint16 so we need to rescale\n", + " nrg.rescale(((nrg.data.min(), nrg.data.max()),))\n", + "\n", + "imshow(nrg.data_as_image())" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "with Reader(src_path) as cog:\n", " # Apply NDVI band math\n", " # (NIR - RED) / (NIR + RED)\n", " ndvi = cog.preview(expression=\"(b4-b1)/(b4+b1)\")\n", @@ -313,8 +363,8 @@ " print(ndvi.data.dtype)\n", " print(\"NDVI range: \", ndvi.data.min(), ndvi.data.max())\n", "\n", - "image = ndvi.post_process(in_range=((-1,1),))\n", - "imshow(image.data[0])" + "ndvi.rescale(in_range=((-1,1),))\n", + "imshow(ndvi.data_as_image())" ] }, { @@ -332,7 +382,7 @@ "metadata": {}, "outputs": [], "source": [ - "with COGReader(src_path) as cog:\n", + "with Reader(src_path) as cog:\n", " print(f\"Bounds in dataset CRS: {cog.bounds}\")\n", " print(f\"Bounds WGS84: {cog.geographic_bounds}\")\n", " print(f\"MinZoom (WebMercator): {cog.minzoom}\")\n", @@ -351,7 +401,7 @@ "print(repr(tms))\n", "\n", "# 
Get the list of tiles for the COG minzoom \n", - "with COGReader(src_path) as cog:\n", + "with Reader(src_path) as cog:\n", " tile_cover = list(tms.tiles(*cog.geographic_bounds, zooms=cog.minzoom))\n", "\n", "print(f\"Nb of Z{cog.minzoom} Mercator tiles: {len(tile_cover)}\")\n", @@ -364,11 +414,14 @@ "metadata": {}, "outputs": [], "source": [ - "with COGReader(src_path) as cog:\n", + "with Reader(src_path) as cog:\n", " img_1 = cog.tile(*tile_cover[0])\n", + " img_1.rescale(((0, 40000),))\n", " print(img_1.data.shape)\n", "\n", " img_2 = cog.tile(*tile_cover[1])\n", + " img_2.rescale(((0, 40000),))\n", + "\n", " print(img_2.data.shape)" ] }, @@ -396,12 +449,12 @@ "metadata": {}, "outputs": [], "source": [ - "with COGReader(src_path) as cog:\n", + "with Reader(src_path) as cog:\n", " ndvi = cog.tile(*tile_cover[0], expression=\"(b4-b1)/(b4+b1)\")\n", " print(ndvi.data.shape)\n", "\n", - "image = ndvi.post_process(in_range=((-1,1),))\n", - "imshow(image.data[0])" + "ndvi.rescale(in_range=((-1,1),))\n", + "imshow(ndvi.data[0])" ] }, { @@ -419,9 +472,9 @@ "metadata": {}, "outputs": [], "source": [ - "with COGReader(src_path) as cog:\n", + "with Reader(src_path) as cog:\n", " # By default `part()` will read the highest resolution. 
We can limit this by using the `max_size` option.\n", - " img = cog.part((-87.92238235473633, 30.954131465929947, -87.87843704223633, 30.97996389724008), max_size=1024)\n", + " img = cog.part((-74.30680274963379, 40.60748547709819, -74.29478645324707, 40.61567903099978), max_size=1024)\n", " print(img.data.shape)\n", " print(img.bounds)\n", " print(img.crs)" @@ -433,6 +486,8 @@ "metadata": {}, "outputs": [], "source": [ + "img.rescale(((0, 40000),))\n", + "\n", "imshow(img.data_as_image()[:,:,0:3])" ] }, @@ -451,8 +506,8 @@ "metadata": {}, "outputs": [], "source": [ - "with COGReader(src_path) as cog:\n", - " values = cog.point(-87.92238235473633, 30.954131465929947)\n", + "with Reader(src_path) as cog:\n", + " values = cog.point(-74.30680274963379, 40.60748547709819)\n", "print(values)" ] }, @@ -471,7 +526,61 @@ "metadata": {}, "outputs": [], "source": [ - "feat = {\"type\":\"Feature\",\"properties\":{},\"geometry\":{\"type\":\"Polygon\",\"coordinates\":[[[-87.91989326477051,30.977388327504983],[-87.92341232299805,30.9747390975502],[-87.92015075683594,30.97282571907513],[-87.91723251342773,30.971869015455276],[-87.9192066192627,30.96914603729001],[-87.92032241821289,30.965466213678003],[-87.91869163513184,30.960093416531947],[-87.91577339172363,30.957885330068873],[-87.91028022766113,30.95700208119036],[-87.90839195251465,30.955971613842785],[-87.91105270385741,30.954646710918635],[-87.91508674621582,30.954793923262105],[-87.92135238647461,30.953321789618688],[-87.92126655578612,30.947506639952913],[-87.92324066162108,30.94353152388283],[-87.9224681854248,30.9393353886492],[-87.92109489440918,30.936832343075928],[-87.92075157165527,30.9326359137502],[-87.91646003723145,30.934034743992026],[-87.91534423828124,30.937494920341457],[-87.91611671447754,30.941764752554082],[-87.91053771972656,30.943973211611713],[-87.91414260864258,30.948242754412334],[-87.91671752929688,30.949862186261473],[-87.91191101074219,30.949494135978654],[-87.90899276733398,30.950377454275596],[
-87.90349960327147,30.95045106376507],[-87.90298461914062,30.953174575006617],[-87.89912223815918,30.953763432093723],[-87.89543151855469,30.953027360167685],[-87.89122581481934,30.955529981576515],[-87.89551734924316,30.959651803323208],[-87.89912223815918,30.960903035444577],[-87.90238380432129,30.95979900795299],[-87.90633201599121,30.96053502769875],[-87.9082202911377,30.963479049959364],[-87.91345596313477,30.964877428739207],[-87.91259765625,30.967306143211744],[-87.9085636138916,30.965466213678003],[-87.90547370910643,30.96553981154008],[-87.90667533874512,30.96885165662014],[-87.90684700012207,30.97039714501039],[-87.89517402648926,30.972972903396382],[-87.89328575134277,30.97643166961476],[-87.8957748413086,30.979080852589725],[-87.89852142333984,30.977093972252376],[-87.90006637573242,30.97643166961476],[-87.9019546508789,30.978712914907245],[-87.90633201599121,30.97805062350409],[-87.90461540222168,30.975107050552193],[-87.90521621704102,30.97422396096446],[-87.90796279907227,30.976358080149122],[-87.90976524353026,30.976063721719164],[-87.90907859802245,30.973856004558257],[-87.9111385345459,30.974076778572197],[-87.91379928588867,30.975769362381378],[-87.9177474975586,30.97643166961476],[-87.91929244995116,30.977314738776947],[-87.91989326477051,30.977388327504983]]]}}" + "feat = {\n", + " \"type\": \"Feature\",\n", + " \"properties\": {},\n", + " \"geometry\": {\n", + " \"type\": \"Polygon\",\n", + " \"coordinates\": [\n", + " [\n", + " [\n", + " -74.30384159088135,\n", + " 40.614245638811646\n", + " ],\n", + " [\n", + " -74.30680274963379,\n", + " 40.61121586776988\n", + " ],\n", + " [\n", + " -74.30590152740477,\n", + " 40.608967884350946\n", + " ],\n", + " [\n", + " -74.30272579193115,\n", + " 40.60748547709819\n", + " ],\n", + " [\n", + " -74.29875612258911,\n", + " 40.60786015456402\n", + " ],\n", + " [\n", + " -74.2960524559021,\n", + " 40.61012446497514\n", + " ],\n", + " [\n", + " -74.29478645324707,\n", + " 40.61390357476733\n", + " ],\n", + 
" [\n", + " -74.29882049560547,\n", + " 40.61515780103489\n", + " ],\n", + " [\n", + " -74.30294036865233,\n", + " 40.61567903099978\n", + " ],\n", + " [\n", + " -74.3035626411438,\n", + " 40.61502749290829\n", + " ],\n", + " [\n", + " -74.30384159088135,\n", + " 40.614245638811646\n", + " ]\n", + " ]\n", + " ]\n", + " }\n", + "}" ] }, { @@ -480,7 +589,7 @@ "metadata": {}, "outputs": [], "source": [ - "with COGReader(src_path) as cog:\n", + "with Reader(src_path) as cog:\n", " # we use the feature to define the bounds and the mask\n", " # but we use `dst_crs` options to keep the projection from the input dataset\n", " # By default `feature()` will read the highest resolution. We can limit this by using the `max_size` option.\n", @@ -498,15 +607,9 @@ }, "outputs": [], "source": [ + "img.rescale(((0, 40000),))\n", "imshow(img.data_as_image()[:,:,0:3])" ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [] } ], "metadata": { @@ -514,7 +617,8 @@ "hash": "e5a596c8625da0593f23bdd5ea51ce5c4572779fa5edc69fb6a18fc94feb7fb6" }, "kernelspec": { - "display_name": "Python 3.8.2 64-bit", + "display_name": "Python 3 (ipykernel)", + "language": "python", "name": "python3" }, "language_info": { @@ -527,7 +631,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.8.2" + "version": "3.9.13" } }, "nbformat": 4, diff --git a/docs/src/examples/Using-tms.ipynb b/docs/src/examples/Using-tms.ipynb index 7e88260c..5cb3a94e 100644 --- a/docs/src/examples/Using-tms.ipynb +++ b/docs/src/examples/Using-tms.ipynb @@ -21,13 +21,13 @@ "# Requirements\n", "\n", "To be able to run this notebook you'll need the following requirements:\n", - "- rio-tiler~= 3.0\n", + "- rio-tiler~= 4.0\n", "- ipyleaflet" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 2, "metadata": {}, "outputs": [], "source": [ @@ -37,7 +37,7 @@ }, { "cell_type": "code", - "execution_count": null, + 
"execution_count": 3, "metadata": {}, "outputs": [], "source": [ @@ -59,22 +59,17 @@ "source": [ "## Data\n", "\n", - "For this demo we will use some NAIP data hosted on Azure.\n", - "\n", - "https://azure.microsoft.com/fr-fr/services/open-datasets/catalog/naip/\n", - "\n", - "\n", - "The data is similar to the data hosted on [AWS](https://registry.opendata.aws/naip/), but using the one on Azure is easier because it offers direct `http` access without needing an AWS account." + "For this demo we will use some High resolution RGB-Nir data hosted on [AWS](https://registry.opendata.aws/nj-imagery/)." ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 4, "metadata": {}, "outputs": [], "source": [ "# For this DEMO we will use this file\n", - "src_path = \"https://naipblobs.blob.core.windows.net/naip/v002/al/2019/al_60cm_2019/30087/m_3008701_ne_16_060_20191115.tif\"" + "src_path = \"https://njogis-imagery.s3.amazonaws.com/2020/cog/I7D16.tif\"" ] }, { @@ -88,7 +83,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 5, "metadata": {}, "outputs": [], "source": [ @@ -100,7 +95,7 @@ "from tornado.httpserver import HTTPServer\n", "from tornado.concurrent import run_on_executor\n", "\n", - "from rio_tiler.io import COGReader\n", + "from rio_tiler.io import Reader\n", "from rio_tiler.errors import TileOutsideBounds\n", "from rio_tiler.profiles import img_profiles\n", "\n", @@ -137,7 +132,7 @@ " def _get_tile(self, tms, z, x, y):\n", "\n", " try:\n", - " with COGReader(self.url, tms=morecantile.tms.get(tms)) as cog:\n", + " with Reader(self.url, tms=morecantile.tms.get(tms)) as cog:\n", " img = cog.tile(x, y, z, indexes=(1,2,3))\n", " except TileOutsideBounds:\n", " raise web.HTTPError(404)\n", @@ -169,11 +164,31 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 6, "metadata": { "scrolled": false }, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + 
"Supported TMS:\n", + "- LINZAntarticaMapTilegrid | urn:ogc:def:crs:EPSG::5482\n", + "- EuropeanETRS89_LAEAQuad | urn:ogc:def:crs:EPSG::3035\n", + "- CanadianNAD83_LCC | urn:ogc:def:crs:EPSG::3978\n", + "- UPSArcticWGS84Quad | urn:ogc:def:crs:EPSG::5041\n", + "- NZTM2000 | urn:ogc:def:crs:EPSG::2193\n", + "- NZTM2000Quad | urn:ogc:def:crs:EPSG::2193\n", + "- UTM31WGS84Quad | urn:ogc:def:crs:EPSG::32631\n", + "- UPSAntarcticWGS84Quad | urn:ogc:def:crs:EPSG::5042\n", + "- WorldMercatorWGS84Quad | urn:ogc:def:crs:EPSG::3395\n", + "- WGS1984Quad | urn:ogc:def:crs:EPSG::4326\n", + "- WorldCRS84Quad | urn:ogc:def:crs:OGC::CRS84\n", + "- WebMercatorQuad | urn:ogc:def:crs:EPSG::3857\n" + ] + } + ], "source": [ "print(\"Supported TMS:\")\n", "for name, tms in morecantile.tms.tms.items():\n", @@ -189,15 +204,41 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 9, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "{'bounds': BoundingBox(left=-74.3095632062702, bottom=40.603994417539994, right=-74.29151245384847, top=40.61775082944064), 'minzoom': 14, 'maxzoom': 19, 'band_metadata': [('b1', {}), ('b2', {}), ('b3', {}), ('b4', {})], 'band_descriptions': [('b1', ''), ('b2', ''), ('b3', ''), ('b4', '')], 'dtype': 'uint16', 'nodata_type': 'None', 'colorinterp': ['red', 'green', 'blue', 'undefined'], 'driver': 'GTiff', 'count': 4, 'overviews': [2, 4, 8, 16], 'width': 5000, 'height': 5000}\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "7b640ef0c2b34a37902653915778514d", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "Map(center=[40.610872623490316, -74.30053783005934], controls=(ZoomControl(options=['position', 'zoom_in_text'…" + ] + }, + "execution_count": 9, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ - "with COGReader(src_path) as cog:\n", + "with Reader(src_path) as cog:\n", " info = cog.info()\n", 
+ " \n", "print(info.dict(exclude_none=True))\n", "\n", - "m = Map(center=(30.96, -87.90), zoom=info.minzoom, basemap={})\n", + "bounds = info.bounds\n", + "center = ((bounds[1] + bounds[3]) / 2, (bounds[0] + bounds[2]) / 2)\n", + "m = Map(center=center, zoom=info.minzoom, basemap={})\n", "\n", "layer = TileLayer(\n", " url=\"http://127.0.0.1:8080/tiles/WebMercatorQuad/{z}/{x}/{y}\",\n", @@ -224,11 +265,13 @@ }, "outputs": [], "source": [ - "with COGReader(src_path, tms=morecantile.tms.get(\"WorldCRS84Quad\")) as cog:\n", + "with Reader(src_path, tms=morecantile.tms.get(\"WorldCRS84Quad\")) as cog:\n", " info = cog.info()\n", "print(info.dict(exclude_none=True))\n", "\n", - "m = Map(center=(30.96, -87.90), zoom=info.minzoom, basemap={}, crs=projections.EPSG4326)\n", + "bounds = info.bounds\n", + "center = ((bounds[1] + bounds[3]) / 2, (bounds[0] + bounds[2]) / 2)\n", + "m = Map(center=center, zoom=info.minzoom, basemap={}, crs=projections.EPSG4326)\n", "\n", "layer = TileLayer(\n", " url=\"http://127.0.0.1:8080/tiles/WorldCRS84Quad/{z}/{x}/{y}\",\n", @@ -242,7 +285,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 11, "metadata": {}, "outputs": [], "source": [ @@ -259,7 +302,7 @@ ], "metadata": { "kernelspec": { - "display_name": "Python 3", + "display_name": "Python 3 (ipykernel)", "language": "python", "name": "python3" }, @@ -273,7 +316,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.8.2" + "version": "3.9.13" } }, "nbformat": 4, diff --git a/docs/src/intro.md b/docs/src/intro.md index 490dbea1..0049cbc6 100644 --- a/docs/src/intro.md +++ b/docs/src/intro.md @@ -1,20 +1,24 @@ ## Read data +`rio-tiler` has **Readers** classes which have methods to access data in `Tile`, `Part` (bbox), `Feature` (GeoJSON), `Point` (lon, lat) or as a whole. 
+ +Here is a quick overview of how to use rio-tiler's main reader `rio_tiler.io.rasterio.Reader`: + ```python -from rio_tiler.io import COGReader -from rio_tiler.models import ImageData +from rio_tiler.io import Reader +from rio_tiler.models import ImageData, PointData tile_x = 691559 tile_y = 956905 tile_zoom = 21 -with COGReader( +with Reader( "http://oin-hotosm.s3.amazonaws.com/5a95f32c2553e6000ce5ad2e/0/10edab38-1bdd-4c06-b83d-6e10ac532b7d.tif" -) as cog: +) as dst: # Read data for a slippy map tile - img = cog.tile(tile_x, tile_y, tile_zoom, tilesize=256) - assert isinstance(img, ImageData) + img = dst.tile(tile_x, tile_y, tile_zoom, tilesize=256) + assert isinstance(img, ImageData) # Image methods return data as rio_tiler.models.ImageData object print(img.data.shape) >>> (3, 256, 256) @@ -22,68 +26,68 @@ with COGReader( >>> (256, 256) # Read the entire data - img = cog.read() + img = dst.read() print(img.data.shape) >>> (3, 11666, 19836) # Read part of a data for a given bbox (we use `max_size=1024` to limit the data transfer and read lower resolution data) - img = cog.part([-61.281, 15.539, -61.279, 15.541], max_size=1024) + img = dst.part([-61.281, 15.539, -61.279, 15.541], max_size=1024) print(img.data.shape) >>> (3, 1024, 1024) # Read data for a given geojson polygon (we use `max_size=1024` to limit the data transfer and read lower resolution data) - img = cog.feature(geojson_feature, max_size=1024) + img = dst.feature(geojson_feature, max_size=1024) # Get a preview (size is maxed out to 1024 by default to limit the data transfer and read lower resolution data) - img = cog.preview() + img = dst.preview() print(img.data.shape) >>> (3, 603, 1024) # Get pixel values for a given lon/lat coordinate - values = cog.point(-61.281, 15.539) - print(values) + values = dst.point(-61.281, 15.539) + assert isinstance(values, PointData) # Point methods return data as rio_tiler.models.PointData object + print(values.data) >>> [47, 62, 43] - - # You can also use the `old
style` notation - data, mask = cog.tile(691559, 956905, 21, tilesize=256) - print(data.shape) - >>> (3, 256, 256) - print(mask.shape) - >>> (256, 256) ``` -The `COGReader` class has other interesting features, please see [User Guide - Readers](readers.md). +The `rio_tiler.io.rasterio.Reader` class has other interesting features, please see [User Guide - Readers](readers.md). ## Render the data as an image (PNG/JPEG) ```python -with COGReader( +with Reader( "http://oin-hotosm.s3.amazonaws.com/5a95f32c2553e6000ce5ad2e/0/10edab38-1bdd-4c06-b83d-6e10ac532b7d.tif" -) as cog: - img = cog.tile(691559, 956905, 21, tilesize=256) - buff = img.render() # this returns a buffer (PNG by default) +) as dst: + img = dst.tile(691559, 956905, 21, tilesize=256) + + # Encode the data in PNG (default) + buff = img.render() + + # Encode the data in JPEG + buff = img.render(img_format="JPEG") ``` ## Rescale non-byte data and/or apply colormap ```python -with COGReader( - "s3://landsat-pds/c1/L8/015/029/LC08_L1GT_015029_20200119_20200119_01_RT/LC08_L1GT_015029_20200119_20200119_01_RT_B8.TIF", - nodata=0, -) as cog: - img = cog.tile(150, 187, 9) +from rio_tiler.colormap import cmap + +# Get Colormap +cm = cmap.get("viridis") + +with Reader( + "https://sentinel-cogs.s3.amazonaws.com/sentinel-s2-l2a-cogs/29/R/KH/2020/2/S2A_29RKH_20200219_0_L2A/B01.tif", +) as dst: + img = dst.tile(239, 220, 9) # Rescale the data from 0-10000 to 0-255 - image_rescale = img.post_process( + img.rescale( in_range=((0, 10000),), out_range=((0, 255),), ) - # Get Colormap - cm = cmap.get("viridis") - # Apply colormap and create a PNG buffer - buff = image_rescale.render(colormap=cm) # this returns a buffer (PNG by default) + buff = img.render(colormap=cm) # this returns a buffer (PNG by default) ``` ## Use creation options to match `mapnik` defaults. 
@@ -91,10 +95,10 @@ with COGReader( ```python from rio_tiler.profiles import img_profiles -with COGReader( +with Reader( "http://oin-hotosm.s3.amazonaws.com/5a95f32c2553e6000ce5ad2e/0/10edab38-1bdd-4c06-b83d-6e10ac532b7d.tif" -) as cog: - img = cog.tile(691559, 956905, 21, tilesize=256) +) as dst: + img = dst.tile(691559, 956905, 21, tilesize=256) options = img_profiles.get("webp") @@ -119,16 +123,15 @@ with open("my.png", "wb") as f: You can also export image data to a numpy binary format (`NPY`). ```python -with COGReader( - "s3://landsat-pds/c1/L8/015/029/LC08_L1GT_015029_20200119_20200119_01_RT/LC08_L1GT_015029_20200119_20200119_01_RT_B8.TIF", - nodata=0, -) as cog: - img = cog.tile(150, 187, 9) +with Reader( + "https://sentinel-cogs.s3.amazonaws.com/sentinel-s2-l2a-cogs/29/R/KH/2020/2/S2A_29RKH_20200219_0_L2A/B01.tif", +) as dst: + img = dst.tile(239, 220, 9) buff = img.render(img_format="npy") npy_tile = numpy.load(BytesIO(buff)) - assert npy_tile.shape == (2, 256, 256) # mask is appened to the end of the data + assert npy_tile.shape == (2, 256, 256) # mask is added to the end of the data buff = img.render(img_format="npy", add_mask=False) diff --git a/docs/src/models.md b/docs/src/models.md index f0ec045a..dc6423c4 100644 --- a/docs/src/models.md +++ b/docs/src/models.md @@ -14,6 +14,7 @@ This class has helper methods like `render` which forward internal data and mask - **crs**: coordinate reference system for the data ([rasterio.crs.CRS](https://github.com/rasterio/rasterio/blob/master/rasterio/crs.py#L21), optional) - **metadata**: additional metadata (dict, optional) - **band_names**: image band's names +- **dataset_statistics**: Dataset's min/max values (list of (min,max), optional) ```python import numpy @@ -30,7 +31,7 @@ print(ImageData(d, m)) bounds=None, crs=None, metadata={}, - band_names=['1', '2', '3'], + band_names=['b1', 'b2', 'b3'], ) ``` @@ -76,7 +77,7 @@ print(image.shape) >>> (256, 256, 3) ``` -- **post_process()**: Apply rescaling or/and 
rio-color formula to the data array. Returns a new ImageData instance. +- **post_process**: Apply rescaling or/and rio-color formula to the data array. Returns a new ImageData instance. ```python import numpy @@ -116,6 +117,80 @@ image = img.post_process( assert isinstance(image, ImageData) ``` +- **rescale()**: linear rescaling of the data in place + +!!! info "New in version 3.1.5" + +```python +import numpy +from rio_tiler.models import ImageData + +d = numpy.random.randint(0, 3000, (3, 256, 256)) +m = numpy.zeros((256, 256)) + 255 + +img = ImageData(d, m) + +print(img.data.dtype) +>>> 'int64' + +print(img.data.max()) +>>> 2999 + +# linearly rescale the data in place +img.rescale(in_range=((0, 3000),),) +print(img.data.max()) +>>> 254 + +print(img.data.dtype) +>>> 'uint8' +``` + +- **apply_color_formula()**: Apply `rio-color`'s color formula in place + +!!! info "New in version 3.1.5" + +```python +import numpy +from rio_tiler.models import ImageData + +d = numpy.random.randint(0, 3000, (3, 256, 256)) +m = numpy.zeros((256, 256)) + 255 + +img = ImageData(d, m) + +print(img.data.dtype) +>>> 'int64' + +img.apply_color_formula("Gamma RGB 3.1") +print(img.data.dtype) +>>> 'uint8' +``` + +- **apply_expression()**: Apply band math expression + +!!! info "New in version 4.0" + +```python +import numpy +from rio_tiler.models import ImageData + +d = numpy.random.randint(0, 3000, (3, 256, 256)) +m = numpy.zeros((256, 256)) + 255 + +img = ImageData(d, m) +print(img.band_names) +>>> ["b1", "b2", "b3"] # Defaults + +ratio = img.apply_expression("b1/b2") # Returns a new ImageData object +assert isinstance(ratio, ImageData) + +print(ratio.band_names) +>>> ["b1/b2"] + +print(ratio.data.shape) +>>> (1, 256, 256) +``` + - **render()**: Render the data/mask to an image buffer (forward data and mask to rio_tiler.utils.render).
```python @@ -165,14 +240,91 @@ print(get_meta(buf)) Note: Starting with `rio-tiler==2.1`, when the output datatype is not valid for a driver (e.g `float` for `PNG`), `rio-tiler` will automatically rescale the data using the `min/max` value for the datatype (ref: https://github.com/cogeotiff/rio-tiler/pull/391). + +## PointData + +!!! info "New in version 4.0" + +#### Attributes + +- **data**: point array (numpy.ndarray) +- **mask**: gdal/rasterio mask array (numpy.ndarray) +- **assets**: assets list used to create the data array (list, optional) +- **coordinates**: Coordinates of the point (Tuple[float, float], optional) +- **crs**: coordinate reference system for the data ([rasterio.crs.CRS](https://github.com/rasterio/rasterio/blob/master/rasterio/crs.py#L21), optional) +- **metadata**: additional metadata (dict, optional) +- **band_names**: values band's names + +```python +import numpy +from rio_tiler.models import PointData + +d = numpy.zeros((3)) +m = numpy.zeros((1), dtype="uint8") + 255 + +print(PointData(d, m)) +>>> PointData( + data=array([0., 0., 0.]), + mask=array([255]), + assets=None, + coordinates=None, + crs=None, + metadata={}, + band_names=['b1', 'b2', 'b3'], +) +``` + +#### Properties + +- **count**: number of bands in the data array (int) + +#### Methods + +- **as_masked()**: Return the data array as a `numpy.ma.MaskedArray` + +```python +import numpy +from rio_tiler.models import PointData + +d = numpy.zeros((3)) +m = numpy.zeros((1), dtype="uint8") + 255 + +masked = PointData(d, m).as_masked() +print(type(masked)) +>>> numpy.ma.core.MaskedArray +``` + +- **apply_expression()**: Apply band math expression + +```python +import numpy +from rio_tiler.models import PointData + +d = numpy.random.randint(0, 3000, (3)) +m = numpy.zeros((1), dtype="uint8") + 255 + +pts = PointData(d, m) +print(pts.band_names) +>>> ["b1", "b2", "b3"] # Defaults + +ratio = pts.apply_expression("b1/b2") # Returns a new PointData object +assert isinstance(ratio, 
PointData) + +print(ratio.band_names) +>>> ["b1/b2"] + +print(ratio.count) +>>> 1 +``` + ## Others -Readers methods (`info`, `metadata` and `stats`) returning metadata like results return [pydantic](https://pydantic-docs.helpmanual.io) models to make sure the values are valids. +Reader methods that return metadata-like results (`info()` and `statistics()`) return [pydantic](https://pydantic-docs.helpmanual.io) models to make sure the values are valid. ### Info ```python -from rio_tiler.io import COGReader +from rio_tiler.io import Reader from rio_tiler.models import Info # Schema @@ -308,10 +460,10 @@ print(Info.schema()) } # Example -with COGReader( +with Reader( "http://oin-hotosm.s3.amazonaws.com/5a95f32c2553e6000ce5ad2e/0/10edab38-1bdd-4c06-b83d-6e10ac532b7d.tif" -) as cog: - info = cog.info() +) as src: + info = src.info() print(info["nodata_type"]) >>> "None" @@ -324,8 +476,8 @@ print(info.json(exclude_none=True)) 'bounds': [-61.287001876638215, 15.537756794450583, -61.27877967704677, 15.542486503997608], 'minzoom': 16, 'maxzoom': 22, - 'band_metadata': [('1', {}), ('2', {}), ('3', {})], - 'band_descriptions': [('1', ''), ('2', ''), ('3', '')], + 'band_metadata': [('b1', {}), ('b2', {}), ('b3', {})], + 'band_descriptions': [('b1', ''), ('b2', ''), ('b3', '')], 'dtype': 'uint8', 'nodata_type': 'None', 'colorinterp': ['red', 'green', 'blue'], @@ -337,12 +489,12 @@ print(info.json(exclude_none=True)) } ``` -Note: starting with `rio-tiler>=2.0.8`, additional metadata can be set (e.g. driver, count, width, height, overviews in `COGReader.info()`) +Note: starting with `rio-tiler>=2.0.8`, additional metadata can be set (e.g.
driver, count, width, height, overviews in `Reader.info()`) ### BandStatistics ```python -from rio_tiler.io import COGReader +from rio_tiler.io import Reader from rio_tiler.models import BandStatistics # Schema @@ -441,19 +593,19 @@ print(BandStatistics.schema()) } # Example -with COGReader( +with Reader( "http://oin-hotosm.s3.amazonaws.com/5a95f32c2553e6000ce5ad2e/0/10edab38-1bdd-4c06-b83d-6e10ac532b7d.tif" -) as cog: - stats = cog.statistics() - assert isinstance(stats["1"], BandStatistics) +) as src: + stats = src.statistics() + assert isinstance(stats["b1"], BandStatistics) -print(stats["1"]["min"]) +print(stats["b1"]["min"]) >>> 0.0 -print(stats["1"].min) +print(stats["b1"].min) >>> 0.0 -print(stats["1"].json(exclude_none=True)) +print(stats["b1"].json(exclude_none=True)) >>> { "min": 0, "max": 255, diff --git a/docs/src/mosaic.md b/docs/src/mosaic.md index 8fa6bce6..f0b579d8 100644 --- a/docs/src/mosaic.md +++ b/docs/src/mosaic.md @@ -53,14 +53,14 @@ Returns: ### Examples ```python -from rio_tiler.io import COGReader +from rio_tiler.io import Reader from rio_tiler.mosaic import mosaic_reader from rio_tiler.mosaic.methods import defaults from rio_tiler.models import ImageData def tiler(src_path: str, *args, **kwargs) -> ImageData: - with COGReader(src_path) as cog: + with Reader(src_path) as cog: return cog.tile(*args, **kwargs) mosaic_assets = ["mytif1.tif", "mytif2.tif", "mytif3.tif"] diff --git a/docs/src/readers.md b/docs/src/readers.md index b23a2f6b..e97588b9 100644 --- a/docs/src/readers.md +++ b/docs/src/readers.md @@ -1,16 +1,16 @@ -`rio-tiler`'s COGReader and STACReader are built from its abstract base classes (`AsyncBaseReader`, `BaseReader`, `MultiBandReader`, `MultiBaseReader`). Those Classes implements defaults interfaces which helps the integration in broader application. 
To learn more about `rio-tiler`'s base classes see [Base classes and custom readers](advanced/custom_readers.md) +`rio-tiler`'s Readers are built from its abstract base classes (`BaseReader`, `MultiBandReader`, `MultiBaseReader`). Those classes implement default interfaces which help integration into broader applications. To learn more about `rio-tiler`'s base classes see [Base classes and custom readers](advanced/custom_readers.md) -## rio_tiler.io.COGReader +## rio_tiler.io.rasterio.Reader -The `COGReader` is designed to work with simple raster datasets (e.g COG, GeoTIFF, ...). +The `Reader` is designed to work with simple raster datasets (e.g COG, GeoTIFF, ...). The class is derived from the `rio_tiler.io.base.BaseReader` base class. ```python -from rio_tiler.io import COGReader +from rio_tiler.io import Reader -COGReader.__mro__ ->>> (rio_tiler.io.cogeo.COGReader, +Reader.__mro__ +>>> (rio_tiler.io.rasterio.Reader, rio_tiler.io.base.BaseReader, rio_tiler.io.base.SpatialMixin, object) @@ -21,29 +21,30 @@ COGReader.__mro__ - **input** (str): filepath - **dataset** (rasterio dataset, optional): rasterio opened dataset - **tms** (morecantile.TileMatrixSet, optional): morecantile TileMatrixSet used for tile reading (defaults to WebMercator) -- **minzoom** (int, optional): dataset's minimum zoom level (for input tms) -- **maxzoom** (int, optional): dataset's maximum zoom level (for input tms) +- **geographic_crs** (rasterio.crs.CRS, optional): CRS to use to calculate the geographic bounds (default to WGS84) - **colormap** (dict, optional): dataset's colormap +- **options** (rio_tiler.reader.Options, optional): Options to forward to rio_tiler.reader functions (e.g nodata, vrt_options, resampling) #### Properties - **bounds**: dataset's bounds (in dataset crs) - **crs**: dataset's crs - **geographic_bounds**: dataset's bounds in WGS84 - +- **minzoom**: dataset minzoom (in TMS) +- **maxzoom**: dataset maxzoom (in TMS) ```python -from rio_tiler.io import COGReader -
-with COGReader("myfile.tif") as cog: - print(cog.dataset) - print(cog.tms.identifier) - print(cog.minzoom) - print(cog.maxzoom) - print(cog.bounds) - print(cog.crs) - print(cog.geographic_bounds) - print(cog.colormap) +from rio_tiler.io import Reader + +with Reader("myfile.tif") as src: + print(src.dataset) + print(src.tms.identifier) + print(src.minzoom) + print(src.maxzoom) + print(src.bounds) + print(src.crs) + print(src.geographic_bounds) + print(src.colormap) >> WebMercatorQuad @@ -60,51 +61,53 @@ EPSG:32620 - **read()**: Read the entire dataset ```python -from rio_tiler.io import COGReader +from rio_tiler.io import Reader from rio_tiler.models import ImageData -with COGReader("myfile.tif") as cog: - img = cog.read() +with Reader("myfile.tif") as src: + img = src.read() assert isinstance(img, ImageData) - assert img.crs == cog.dataset.crs + assert img.crs == src.dataset.crs assert img.assets == ["myfile.tif"] - assert img.width == cog.dataset.width - assert img.height == cog.dataset.height - assert img.count == cog.dataset.count + assert img.width == src.dataset.width + assert img.height == src.dataset.height + assert img.count == src.dataset.count # With indexes -with COGReader("myfile.tif") as cog: - img = cog.read(indexes=1) # or cog.read(indexes=(1,)) +with Reader("myfile.tif") as src: + img = src.read(indexes=1) # or src.read(indexes=(1,)) assert img.count == 1 + assert img.band_names == ["b1"] # With expression -with COGReader("myfile.tif") as cog: - img = cog.read(expression="B1/B2") +with Reader("myfile.tif") as src: + img = src.read(expression="b1/b2") assert img.count == 1 + assert img.band_names == ["b1/b2"] ``` - **tile()**: Read map tile from a raster ```python from rio_tiler.contants import WEB_MERCATOR_CRS -from rio_tiler.io import COGReader +from rio_tiler.io import Reader from rio_tiler.models import ImageData -with COGReader("myfile.tif") as cog: - # cog.tile(tile_x, tile_y, tile_z, **kwargs) - img = cog.tile(1, 2, 3, tilesize=256) +with 
Reader("myfile.tif") as src: + # src.tile(tile_x, tile_y, tile_z, **kwargs) + img = src.tile(1, 2, 3, tilesize=256) assert isinstance(img, ImageData) assert img.crs == WEB_MERCATOR_CRS assert img.assets == ["myfile.tif"] # With indexes -with COGReader("myfile.tif") as cog: - img = cog.tile(1, 2, 3, tilesize=256, indexes=1) +with Reader("myfile.tif") as src: + img = src.tile(1, 2, 3, tilesize=256, indexes=1) assert img.count == 1 # With expression -with COGReader("myfile.tif") as cog: - img = cog.tile(1, 2, 3, tilesize=256, expression="B1/B2") +with Reader("myfile.tif") as src: + img = src.tile(1, 2, 3, tilesize=256, expression="B1/B2") assert img.count == 1 # Using buffer @@ -112,14 +115,14 @@ with COGReader("myfile.tif") as cog: # ref: # - https://github.com/cogeotiff/rio-tiler/issues/365 # - https://github.com/cogeotiff/rio-tiler/pull/405 -with COGReader("myfile.tif") as cog: +with Reader("myfile.tif") as src: # add 0.5 pixel on each side of the tile - img = cog.tile(1, 2, 3, tile_buffer=0.5) + img = src.tile(1, 2, 3, buffer=0.5) assert img.width == 257 assert img.height == 257 # add 1 pixel on each side of the tile - img = cog.tile(1, 2, 3, tile_buffer=1) + img = src.tile(1, 2, 3, buffer=1) assert img.width == 258 assert img.height == 258 ``` @@ -127,40 +130,40 @@ with COGReader("myfile.tif") as cog: - **part()**: Read a raster for a given bounding box (`bbox`). By default the bbox is considered to be in WGS84. 
```python -from rio_tiler.io import COGReader +from rio_tiler.io import Reader from rio_tiler.models import ImageData -with COGReader("myfile.tif") as cog: - # cog.part((minx, miny, maxx, maxy), **kwargs) - img = cog.part((10, 10, 20, 20)) +with Reader("myfile.tif") as src: + # src.part((minx, miny, maxx, maxy), **kwargs) + img = src.part((10, 10, 20, 20)) assert isinstance(img, ImageData) assert img.crs == WGS84_CRS assert img.assets == ["myfile.tif"] assert img.bounds == (10, 10, 20, 20) -# Pass bbox in WGS84 (default) but return data in the input COG CRS -with COGReader("myfile.tif") as cog: - img = cog.part((10, 10, 20, 20), dst_crs=cog.dataset.crs) - assert img.crs == cog.dataset.crs +# Pass bbox in WGS84 (default) but return data in the input dataset CRS +with Reader("myfile.tif") as src: + img = src.part((10, 10, 20, 20), dst_crs=src.dataset.crs) + assert img.crs == src.dataset.crs # Limit output size -with COGReader("myfile.tif") as cog: - img = cog.part((10, 10, 20, 20), max_size=2000) +with Reader("myfile.tif") as src: + img = src.part((10, 10, 20, 20), max_size=2000) # With indexes -with COGReader("myfile.tif") as cog: - img = cog.part((10, 10, 20, 20), indexes=1) +with Reader("myfile.tif") as src: + img = src.part((10, 10, 20, 20), indexes=1) # With expression -with COGReader("myfile.tif") as cog: - img = cog.part((10, 10, 20, 20), expression="B1/B2") +with Reader("myfile.tif") as src: + img = src.part((10, 10, 20, 20), expression="b1/b2") ``` - **feature()**: Read a raster for a geojson feature. By default the feature is considered to be in WGS84. 
```python from rio_tiler.constants import WGS84_CRS -from rio_tiler.io import COGReader +from rio_tiler.io import Reader from rio_tiler.models import ImageData feat = { @@ -180,83 +183,87 @@ feat = { }, } -with COGReader("myfile.tif") as cog: - # cog.part(geojson_feature, **kwargs) - img = cog.feature(feat) +with Reader("myfile.tif") as src: + # src.part(geojson_feature, **kwargs) + img = src.feature(feat) assert isinstance(img, ImageData) assert img.crs == WGS84_CRS assert img.assets == ["myfile.tif"] assert img.bounds == (-55.61, 72.36, -53.83, 73.05) # bbox of the input feature -# Pass bbox in WGS84 (default) but return data in the input COG CRS -with COGReader("myfile.tif") as cog: - img = cog.feature(feat, dst_crs=cog.dataset.crs) - assert img.crs == cog.dataset.crs +# Pass bbox in WGS84 (default) but return data in the input dataset CRS +with Reader("myfile.tif") as src: + img = src.feature(feat, dst_crs=src.dataset.crs) + assert img.crs == src.dataset.crs # Limit output size -with COGReader("myfile.tif") as cog: - img = cog.feature(feat, max_size=2000) +with Reader("myfile.tif") as src: + img = src.feature(feat, max_size=2000) # Read high resolution -with COGReader("myfile.tif") as cog: - img = cog.feature(feat, max_size=None) +with Reader("myfile.tif") as src: + img = src.feature(feat, max_size=None) # With indexes -with COGReader("myfile.tif") as cog: - img = cog.feature(feat, indexes=1) +with Reader("myfile.tif") as src: + img = src.feature(feat, indexes=1) # With expression -with COGReader("myfile.tif") as cog: - img = cog.feature(feat, expression="B1/B2") +with Reader("myfile.tif") as src: + img = src.feature(feat, expression="b1/b2") ``` - **preview()**: Read a preview of a raster ```python -from rio_tiler.io import COGReader +from rio_tiler.io import Reader from rio_tiler.models import ImageData -with COGReader("myfile.tif") as cog: - img = cog.preview() +with Reader("myfile.tif") as src: + img = src.preview() assert isinstance(img, ImageData) # With 
indexes -with COGReader("myfile.tif") as cog: - img = cog.preview(indexes=1) +with Reader("myfile.tif") as src: + img = src.preview(indexes=1) # With expression -with COGReader("myfile.tif") as cog: - img = cog.preview(expression="B1+2,B1*4") +with Reader("myfile.tif") as src: + img = src.preview(expression="b1+2;b1*4") ``` -- **point()**: Read the pixel values of a raster for a given `lon, lat` coordinates. By default the coordinates are considered to be in WGS84. +- **point()**: Read the pixel values of a raster for a given `lon, lat` coordinates. By default the coordinates are considered to be in WGS84. ```python -from rio_tiler.io import COGReader +from rio_tiler.io import Reader +from rio_tiler.models import PointData -with COGReader("myfile.tif") as cog: - # cog.point(lon, lat) - print(cog.point(-100, 25)) +with Reader("myfile.tif") as src: + # src.point(lon, lat) + pt = src.point(-100, 25) + assert isinstance(pt, PointData) # With indexes -with COGReader("myfile.tif") as cog: - print(cog.point(-100, 25, indexes=1)) +with Reader("myfile.tif") as src: + pt = src.point(-100, 25, indexes=1) + print(pt.data) >>> [1] # With expression -with COGReader("myfile.tif") as cog: - print(cog.point(-100, 25, expression="B1+2,B1*4")) +with Reader("myfile.tif") as src: + pt = src.point(-100, 25, expression="b1+2;b1*4") + print(pt.data) >>> [3, 4] ``` - **info()**: Return simple metadata about the dataset ```python -from rio_tiler.io import COGReader +from rio_tiler.io import Reader from rio_tiler.models import Info -with COGReader("myfile.tif") as cog: - info = cog.info() +with Reader("myfile.tif") as src: + info = src.info() assert isinstance(info, Info) print(info.dict(exclude_none=True)) @@ -264,8 +271,8 @@ print(info.dict(exclude_none=True)) "bounds": [-119.05915661478785, 13.102845359730287, -84.91821332299578, 33.995073647795806], "minzoom": 3, "maxzoom": 12, - "band_metadata": [["1", {}]], - "band_descriptions": [["1", ""]], + "band_metadata": [["b1", {}]], + 
"band_descriptions": [["b1", ""]], "dtype": "int8", "colorinterp": ["palette"], "nodata_type": "Nodata", @@ -285,21 +292,21 @@ print(info.dict(exclude_none=True)) - **statistics()**: Return image statistics (Min/Max/Stdev) ```python -from rio_tiler.io import COGReader +from rio_tiler.io import Reader -with COGReader("myfile.tif") as cog: - stats = cog.statistics() +with Reader("myfile.tif") as src: + stats = src.statistics() assert isinstance(stats, dict) # stats will be in form or {"band": BandStatistics(), ...} print(stats) >>> { - '1': BandStatistics(...), - '2': BandStatistics(...), - '3': BandStatistics(...) + 'b1': BandStatistics(...), + 'b2': BandStatistics(...), + 'b3': BandStatistics(...) } -print(stats["1"].dict()) +print(stats["b1"].dict()) >>> { "min": 1, "max": 7872, @@ -322,16 +329,16 @@ print(stats["1"].dict()) "percentile_2": 1 } -with COGReader("myfile_with_colormap.tif") as cog: - stats = cog.statistics(categorical=True, categories=[1, 2]) # we limit the categories to 2 defined value (defaults to all dataset values) +with Reader("myfile_with_colormap.tif") as src: + stats = src.statistics(categorical=True, categories=[1, 2]) # we limit the categories to 2 defined value (defaults to all dataset values) assert isinstance(stats, dict) print(stats) >>> { - '1': BandStatistics(...) + 'b1': BandStatistics(...) } # For categorical data, the histogram will represent the density of EACH value. -print(stats["1"].dict()) +print(stats["b1"].dict()) >>> { ... 
"histogram": [ @@ -344,7 +351,7 @@ print(stats["1"].dict()) #### Read Options -`COGReader` accepts several input options which will be forwarded to the `rio_tiler.reader.read` function (low level function accessing the data), those options can be set as reader's attribute or within each method calls: +`Reader` accepts several input options which will be forwarded to the `rio_tiler.reader.read` function (low level function accessing the data), those options can be set as reader's attribute or within each method calls: - **nodata**: Overwrite the nodata value (or set if not present) - **unscale**: Apply internal rescaling factors @@ -353,16 +360,16 @@ print(stats["1"].dict()) - **post_process**: Function to apply after the read operations ```python -with COGReader("my_cog.tif", nodata=0) as cog: - cog.tile(1, 1, 1) +with Reader("my_cog.tif", options={"nodata": 0}) as src: + src.tile(1, 1, 1) # is equivalent to -with COGReader("my_cog.tif") as cog: - cog.tile(1, 1, 1, nodata=0) +with Reader("my_cog.tif") as src: + src.tile(1, 1, 1, nodata=0) ``` -## rio_tiler.io.STACReader +## rio_tiler.io.stac.STACReader In `rio-tiler` v2, we added a `rio_tiler.io.STACReader` to allow tile/metadata fetching of assets withing a STAC item. 
@@ -385,11 +392,12 @@ STACReader.__mro__ - **tms** (morecantile.TileMatrixSet, optional): morecantile TileMatrixSet used for tile reading (defaults to WebMercator) - **minzoom** (int, optional): dataset's minimum zoom level (for input tms) - **maxzoom** (int, optional): dataset's maximum zoom level (for input tms) +- **geographic_crs** (rasterio.crs.CRS, optional): CRS to use to calculate the geographic bounds (default to WGS84) - **include_assets** (set, optional): Set of assets to include from the `available` asset list - **exclude_assets** (set, optional): Set of assets to exclude from the `available` asset list - **include_asset_types** (set, optional): asset types to consider as valid type for the reader - **exclude_asset_types** (set, optional): asset types to consider as invalid type for the reader -- **reader** (BaseReader, optional): Reader to use to read assets (defaults to COGReader) +- **reader** (BaseReader, optional): Reader to use to read assets (defaults to rio_tiler.io.rasterio.Reader) - **reader_options** (dict, optional): Options to forward to the reader init - **fetch_options** (dict, optional): Options to pass to the `httpx.get` or `boto3` when fetching the STAC item @@ -430,7 +438,7 @@ EPSG:4326 #### Methods -The `STACReader` has the same methods as the `COGReader` (defined by the BaseReader/MultiBaseReader classes). +The `STACReader` has the same methods as the `Reader` (defined by the BaseReader/MultiBaseReader classes). !!! Important - Most of `STACReader` methods require to set either `assets=` or `expression=` option. 
@@ -461,7 +469,7 @@ print(img.assets) 'https://sentinel-cogs.s3.us-west-2.amazonaws.com/sentinel-s2-l2a-cogs/34/S/GA/2020/3/S2A_34SGA_20200318_0_L2A/B02.tif', ] print(img.band_names) ->>> ['B01_1', 'B02_1'] +>>> ['B01_b1', 'B02_b1'] # Using `expression=` with STACReader(stac_url, exclude_assets={"thumbnail"}) as stac: @@ -470,26 +478,10 @@ with STACReader(stac_url, exclude_assets={"thumbnail"}) as stac: 103, 8, tilesize=256, - expression="B01/B02", + expression="B01_b1/B02_b1", ) assert img.count == 1 - -# Using `assets=` + `asset_expression` (apply band math in an asset) -with STACReader(stac_url, exclude_assets={"thumbnail"},) as stac: - img = stac.tile( - 145, - 103, - 8, - tilesize=256, - assets=["B01", "B02"], - asset_expression={ - "B01": "b1+500", # add 500 to the first band - "B02": "b1-100", # substract 100 to the first band - } - ) - assert img.count == 2 - # Using `assets=` + `asset_indexes` (select a specific index in an asset) with STACReader(stac_url, exclude_assets={"thumbnail"},) as stac: img = stac.tile( @@ -548,17 +540,17 @@ with STACReader(stac_url, exclude_assets={"thumbnail"},) as stac: assert img.count == 2 # each assets have one band ``` -- **point()**: Read the pixel values for assets for a given `lon, lat` coordinates. By default the coordinates are considered to be in WGS84. +- **point()**: Read the pixel values for assets for a given `lon, lat` coordinates. By default the coordinates are considered to be in WGS84. 
```python with STACReader(stac_url, exclude_assets={"thumbnail"},) as stac: # stac.point(lon, lat, assets=?, expression=?, asset_expression=?, asset_indexes=?, **kwargs) data = stac.point(24.1, 31.9, assets=["B01", "B02"]) -print(data) +print(data.data) >>> [ - [3595], # values for B01 - [3198] # values for B02 + 3595, # values for B01 + 3198 # values for B02 ] ``` @@ -577,8 +569,8 @@ print(info["B01"].json(exclude_none=True)) "bounds": [23.106076243528157, 31.505173744374172, 24.296464503939948, 32.519334871696195], "minzoom": 8, "maxzoom": 11, - "band_metadata": [["1", {}]], - "band_descriptions": [["1", ""]], + "band_metadata": [["b1", {}]], + "band_descriptions": [["b1", ""]], "dtype": "uint16", "nodata_type": "Nodata", "colorinterp": ["gray"], @@ -603,9 +595,9 @@ print(list(stats)) >>> ["B01", "B02"] print(list(stats["B01"])) ->>> ["1"] # B01 has only one band entry "1" +>>> ["b1"] # B01 has only one band entry "b1" -print(stats["B01"]["1"].json(exclude_none=True)) +print(stats["B01"]["b1"].json(exclude_none=True)) { "min": 283.0, "max": 7734.0, @@ -640,11 +632,11 @@ with STACReader(stac_url, exclude_assets={"thumbnail"},) as stac: # stats will be in form or {"band": BandStatistics(), ...} print(list(stats)) ->>> ["B01_1", "B02_1"] +>>> ["B01_b1", "B02_b1"] -assert isinstance(stats["B01_1"], BandStatistics) +assert isinstance(stats["B01_b1"], BandStatistics) -print(info["B01_1"].json(exclude_none=True)) +print(stats["B01_b1"].json(exclude_none=True)) { "min": 283.0, "max": 7734.0, @@ -669,16 +661,511 @@ print(info["B01_1"].json(exclude_none=True)) with STACReader(stac_url, exclude_assets={"thumbnail"},) as stac: # stac.statistics(assets=?, asset_expression=?, asset_indexes=?, **kwargs) - stats = stac.merged_statistics(expression=["B01/B02"], max_size=128) + stats = stac.merged_statistics(expression=["B01_b1/B02_b1"], max_size=128) print(list(stats)) ->>> ["B01/B02"] +>>> ["B01_b1/B02_b1"] -assert isinstance(stats["B01/B02"], BandStatistics) +assert
isinstance(stats["B01_b1/B02_b1"], BandStatistics) ``` ### STAC Expression -When using `expression`, the reader might consider assets as `1 band` data. Expression using multi bands are not supported (e.g: `asset1_b1 + asset2_b2`). +When using `expression`, the user will need to explicitly pass the band number to use within the asset e.g: `asset1_b1 + asset2_b2`. + + +## rio_tiler.io.rasterio.ImageReader + +The `ImageReader` is designed to work with simple raster datasets in their pixel coordinates. + +The class is derived from the `rio_tiler.io.rasterio.Reader` class. +```python +from rio_tiler.io import ImageReader + +ImageReader.__mro__ +>>> (rio_tiler.io.rasterio.ImageReader, + rio_tiler.io.rasterio.Reader, + rio_tiler.io.base.BaseReader, + rio_tiler.io.base.SpatialMixin, + object) +``` + +#### Attributes + +- **input** (str): filepath +- **dataset** (rasterio dataset, optional): rasterio opened dataset +- **colormap** (dict, optional): dataset's colormap +- **options** (rio_tiler.reader.Options, optional): Options to forward to rio_tiler.reader functions (e.g nodata, vrt_options, resampling) + +#### Properties + +- **bounds**: dataset's bounds (in dataset crs) +- **transform**: dataset Affine transform (in pixel coordinates) +- **minzoom**: dataset minzoom +- **maxzoom**: dataset maxzoom + +```python +from rio_tiler.io import ImageReader + +with ImageReader("image.jpg") as src: + print(src.dataset) + print(src.minzoom) + print(src.maxzoom) + print(src.transform) + print(src.bounds) + print(src.colormap) + +>> +0 +3 +Affine(1.0, 0.0, 0.0, 0.0, 1.0, 0.0) +(0, 2000, 2000, 0) +{} +``` + +#### Methods + +- **read()**: Read the entire dataset + +```python +from rio_tiler.io import ImageReader +from rio_tiler.models import ImageData + +with ImageReader("image.jpeg") as src: + img = src.read() + assert isinstance(img, ImageData) + assert not img.crs + assert img.assets == ["image.jpeg"] + assert img.width == src.dataset.width + assert img.height == src.dataset.height +
assert img.count == src.dataset.count + +# With indexes +with ImageReader("image.jpeg") as src: + img = src.read(indexes=1) # or src.read(indexes=(1,)) + assert img.count == 1 + assert img.band_names == ["b1"] + +# With expression +with ImageReader("image.jpeg") as src: + img = src.read(expression="b1/b2") + assert img.count == 1 + assert img.band_names == ["b1/b2"] +``` + +- **tile()**: Read tile from the image + +For ImageReader we are using a custom `LocalTileMatrixSet` constructed from the dataset width and height. The origin is the Top-Left of the image. + +```python +from rio_tiler.io import ImageReader +from rio_tiler.models import ImageData + +with ImageReader("image.jpeg") as src: + # src.tile(tile_x, tile_y, tile_z, **kwargs) + img = src.tile(0, 0, src.maxzoom) + assert isinstance(img, ImageData) + assert not img.crs + assert img.bounds == (0, 256, 256, 0) + + img = src.tile(0, 0, src.minzoom) + assert isinstance(img, ImageData) + assert img.bounds[0] == 0 + assert img.bounds[3] == 0 + +# With indexes +with ImageReader("image.jpeg") as src: + img = src.tile(1, 2, 3, tilesize=256, indexes=1) + assert img.count == 1 + +# With expression +with ImageReader("image.jpeg") as src: + img = src.tile(1, 2, 3, tilesize=256, expression="B1/B2") + assert img.count == 1 +``` + +- **part()**: Read an image for a given bounding box (`bbox`). The origin is the Top-Left of the image. -If assets have difference number of bands and the `asset_indexes` is not specified the process will fail because it will try to apply an expression using arrays of different sizes. 
+```python +from rio_tiler.io import ImageReader +from rio_tiler.models import ImageData + +with ImageReader("image.jpeg") as src: + # src.part((left, bottom, right, top), **kwargs) + img = src.part((0, 256, 256, 0)) # read the top-left 256x256 square of the image + assert isinstance(img, ImageData) + assert img.assets == ["image.jpeg"] + assert img.bounds == (0, 256, 256, 0) + +# Limit output size +with ImageReader("image.jpeg") as src: + img = src.part((0, 256, 256, 0), max_size=50) + +# With indexes +with ImageReader("image.jpeg") as src: + img = src.part((0, 256, 256, 0), indexes=1) + +# With expression +with ImageReader("image.jpeg") as src: + img = src.part((0, 256, 256, 0), expression="b1/b2") +``` + +- **feature()**: Read an image for a GeoJSON feature expressed in the pixel coordinate system. + +```python +from rio_tiler.io import ImageReader +from rio_tiler.models import ImageData + +feat = { + "coordinates": [ + [ + [-100.0, -100.0], + [1000.0, 100.0], + [500.0, 1000.0], + [-50.0, 500.0], + [-100.0, -100.0], + ] + ], + "type": "Polygon", +} + +with ImageReader("image.jpeg") as src: + # src.feature(geojson_feature, **kwargs) + img = src.feature(feat) + assert isinstance(img, ImageData) + assert img.assets == ["image.jpeg"] + assert img.bounds == (-100.0, 1000.0, 1000.0, -100.0) # bbox of the input feature + +# Limit output size +with ImageReader("image.jpeg") as src: + img = src.feature(feat, max_size=100) + +# Read high resolution +with ImageReader("image.jpeg") as src: + img = src.feature(feat, max_size=None) + +# With indexes +with ImageReader("image.jpeg") as src: + img = src.feature(feat, indexes=1) + +# With expression +with ImageReader("image.jpeg") as src: + img = src.feature(feat, expression="b1/b2") +``` + +- **preview()**: Read a preview of a raster + +```python +from rio_tiler.io import ImageReader +from rio_tiler.models import ImageData + +with ImageReader("image.jpeg") as src: + img = src.preview() + assert isinstance(img, ImageData) + +# With indexes
+with ImageReader("image.jpeg") as src: + img = src.preview(indexes=1) + +# With expression +with ImageReader("image.jpeg") as src: + img = src.preview(expression="b1+2;b1*4") +``` + +- **point()**: Read the pixel values of a raster for a given `x, y` coordinates. The origin is the Top-Left of the image. + +```python +from rio_tiler.io import ImageReader +from rio_tiler.models import PointData + +with ImageReader("image.jpeg") as src: + # src.point(x, y) + pt = src.point(0, 0) # pixel at the origin + assert isinstance(pt, PointData) + +# With indexes +with ImageReader("image.jpeg") as src: + pt = src.point(0,0 , indexes=1) + print(pt.data) +>>> [1] + +# With expression +with ImageReader("image.jpeg") as src: + pt = src.point(0, 0, expression="b1+2;b1*4") + print(pt.data) +>>> [3, 4] +``` + +- **info()**: Return simple metadata about the dataset + +```python +from rio_tiler.io import ImageReader +from rio_tiler.models import Info + +with ImageReader("image.jpeg") as src: + info = src.info() + assert isinstance(info, Info) + +print(info.dict(exclude_none=True)) +>>> { + "bounds": [0, 4000, 4000, 0], + "minzoom": 0, + "maxzoom": 3, + "band_metadata": [["b1", {}]], + "band_descriptions": [["b1", ""]], + "dtype": "int8", + "colorinterp": ["palette"], + "nodata_type": "Nodata", + "colormap": { + "0": [0, 0, 0, 0], + "1": [0, 61, 0, 255], + ... + }, + "driver": "GTiff", + "count": 1, + "width": 4000, + "height": 4000, + "overviews": [2, 4, 8], +} +``` + +- **statistics()**: Return image statistics (Min/Max/Stdev) + +```python +from rio_tiler.io import ImageReader + +with ImageReader("image.jpeg") as src: + stats = src.statistics() + assert isinstance(stats, dict) + +# stats will be in form or {"band": BandStatistics(), ...} +print(stats) +>>> { + 'b1': BandStatistics(...), + 'b2': BandStatistics(...), + 'b3': BandStatistics(...) 
+} + +print(stats["b1"].dict()) +>>> { + "min": 1, + "max": 7872, + "mean": 2107.524612053134, + "count": 1045504, + "sum": 2203425412, + "std": 2271.0065537857326, + "median": 2800, + "majority": 1, + "minority": 7072, + "unique": 15, + "histogram": [ + [...], + [...] + ], + "valid_percent": 100, + "masked_pixels": 0, + "valid_pixels": 1045504, + "percentile_98": 6896, + "percentile_2": 1 +} +``` + + + + + + + +## rio_tiler.io.xarray.XarrayReader + +The `XarrayReader` is designed to work with `xarray.DataArray` objects that have full geo-reference metadata (CRS) and spatial coordinate variables (X, Y). + +The class is derived from the `rio_tiler.io.base.BaseReader` class. +```python +from rio_tiler.io.xarray import XarrayReader + +XarrayReader.__mro__ +>>> (rio_tiler.io.xarray.XarrayReader, + rio_tiler.io.base.BaseReader, + rio_tiler.io.base.SpatialMixin, + object) +``` + +#### Attributes + +- **input** (xarray.DataArray): Xarray DataArray +- **tms** (morecantile.TileMatrixSet, optional): morecantile TileMatrixSet used for tile reading (defaults to WebMercator) +- **geographic_crs** (rasterio.crs.CRS, optional): CRS to use to calculate the geographic bounds (default to WGS84) + +#### Properties + +- **bounds**: dataset's bounds (in dataset crs) +- **crs**: dataset's crs +- **geographic_bounds**: dataset's bounds in WGS84 +- **minzoom**: dataset minzoom (in TMS) +- **maxzoom**: dataset maxzoom (in TMS) + + +```python +import numpy +import xarray +from datetime import datetime +from rio_tiler.io.xarray import XarrayReader + +arr = numpy.random.randn(1, 33, 35) +data = xarray.DataArray( + arr, + dims=("time", "y", "x"), + coords={ + "x": list(range(-170, 180, 10)), + "y": list(range(-80, 85, 5)), + "time": [datetime(2022, 1, 1)], + }, +) +data.attrs.update({"valid_min": arr.min(), "valid_max": arr.max()}) +data.rio.write_crs("epsg:4326", inplace=True) + +with XarrayReader(data) as src: + print(src.input) + print(src.tms.identifier) + print(src.minzoom) + print(src.maxzoom) + print(src.bounds) +
print(src.crs) + print(src.geographic_bounds) + +>> +WebMercatorQuad +0 +0 +(-175.0, -82.5, 175.0, 82.5) +EPSG:4326 +(-175.0, -82.5, 175.0, 82.5) +``` + +#### Methods + +- **tile()**: Read map tile from a raster + +```python +from rio_tiler.constants import WEB_MERCATOR_CRS +from rio_tiler.io import XarrayReader +from rio_tiler.models import ImageData + +with XarrayReader(data) as src: + # src.tile(tile_x, tile_y, tile_z, tilesize, resampling_method) + img = src.tile(1, 2, 3) + assert isinstance(img, ImageData) + assert img.crs == WEB_MERCATOR_CRS +``` + +- **part()**: Read a DataArray for a given bounding box (`bbox`). By default the bbox is considered to be in WGS84. + +```python +from rio_tiler.io import XarrayReader +from rio_tiler.models import ImageData + +with XarrayReader(data) as src: + # src.part((minx, miny, maxx, maxy), dst_crs, bounds_crs, resampling_method) + img = src.part((10, 10, 20, 20)) + assert isinstance(img, ImageData) + assert img.crs == WGS84_CRS + assert img.bounds == (10, 10, 20, 20) + +# Pass bbox in WGS84 (default) but return data in the input dataset CRS +with XarrayReader(data) as src: + img = src.part((10, 10, 20, 20), dst_crs=src.crs) + assert img.crs == src.crs +``` + +- **feature()**: Read a DataArray for a GeoJSON feature. By default the feature is considered to be in WGS84.
+ +```python +from rio_tiler.constants import WGS84_CRS +from rio_tiler.io import XarrayReader +from rio_tiler.models import ImageData + +feat = { + "type": "Feature", + "properties": {}, + "geometry": { + "type": "Polygon", + "coordinates": [ + [ + [-54.45, 73.05], + [-55.05, 72.79], + [-55.61, 72.46], + [-53.83, 72.36], + [-54.45, 73.05], + ] + ], + }, +} + +with XarrayReader(data) as src: + # src.feature(geojson_feature, **kwargs) + img = src.feature(feat) + assert isinstance(img, ImageData) + assert img.crs == WGS84_CRS + assert img.bounds == (-55.61, 72.36, -53.83, 73.05) # bbox of the input feature + +# Pass feature in WGS84 (default) but return data in the input dataset CRS +with XarrayReader(data) as src: + img = src.feature(feat, dst_crs=src.crs) + assert img.crs == src.crs +``` + +- **point()**: Read the pixel values of a DataArray for a given `lon, lat` coordinates. By default the coordinates are considered to be in WGS84. + +```python +from rio_tiler.io import XarrayReader +from rio_tiler.models import PointData + +with XarrayReader(data) as src: + # src.point(lon, lat, coord_crs) + pt = src.point(-100, 25) + assert isinstance(pt, PointData) +``` + +- **info()**: Return simple metadata about the DataArray + +```python +from rio_tiler.io import XarrayReader +from rio_tiler.models import Info + +with XarrayReader(data) as src: + info = src.info() + assert isinstance(info, Info) + +print(info.json(exclude_none=True)) +>>> { + "bounds": [-175.0, -82.5, 175.0, 82.5], + "minzoom": 0, + "maxzoom": 0, + "band_metadata": [["b1", {}]], + "band_descriptions": [["b1", "2022-01-01T00:00:00.000000000"]], + "dtype": "float64", + "nodata_type": "None", + "width": 35, + "attrs": { + "valid_min": -3.148671506292848, + "valid_max": 4.214148915352746 + }, + "count": 1, + "height": 33 +} +``` + +- **preview()**: + +!!! Important + + Not Implemented + + +- **statistics()**: + +!!!
Important + + Not Implemented +``` diff --git a/docs/src/supported_format.md b/docs/src/supported_format.md index 1bd88d39..84d3442b 100644 --- a/docs/src/supported_format.md +++ b/docs/src/supported_format.md @@ -1,7 +1,7 @@ `rio-tiler` can work with all raster formats supported by [GDAL](https://gdal.org). That's being said, `rio-tiler` works better with data format that supports **partial reading**, like [Cloud Optimized GeoTIFF](http://cogeo.org). -On interesting feature of Cloud Optimized GeoTIFF is the internal overviews which enable fast preview of the data. For example, when using the `COGReader.preview` method, rio-tiler will only fetch the internal overviews instead of the whole data, to be able to construct the output array. Doing this reduce the amount of data transfer and thus increase the process speed. +On interesting feature of Cloud Optimized GeoTIFF is the internal overviews which enable fast preview of the data. For example, when using the `Reader.preview` method, rio-tiler will only fetch the internal overviews instead of the whole data, to be able to construct the output array. Doing this reduce the amount of data transfer and thus increase the process speed. ### VRT @@ -11,3 +11,14 @@ GDAL's [Virtual format](https://gdal.org/drivers/raster/vrt.html#raster-vrt) is Map Tile reading from VRT might not be efficient if overviews are not present, because GDAL will try to open a lot of files. ![](img/vrt_tile.png) + + +### Xarray + +!!! info "New in version 4.0" + +When `xarray` and `rioxarray` are installed in your environment, you can use `rio_tiler.io.XarrayReader` to read `xarray.DataArray` using the *usual* rio-tiler's Readers methods (`part()`, `tile()`, `feature()`). + +!!! 
warnings + - DataArray must be fully geo-referenced with a CRS and X,Y variables (longitude, latitude) + - Performance is largely dependent on the chunking of the array diff --git a/docs/src/v4_migration.md b/docs/src/v4_migration.md new file mode 100644 index 00000000..4e57670e --- /dev/null +++ b/docs/src/v4_migration.md @@ -0,0 +1,326 @@ + +# Breaking changes + +`rio-tiler` version 4.0 introduced [many breaking changes](release-notes.md). This +document aims to help with migrating your code to use `rio-tiler` 4.0. + +## Python >=3.8 + +Following rasterio, we removed Python 3.7 support (https://github.com/rasterio/rasterio/issues/2445) + +## *COG*Reader -> **Reader** + +Because the main reader works not only with COGs but with most GDAL-supported rasters, we chose to rename it to `Reader`. + +```python +# before +from rio_tiler.io import COGReader +from rio_tiler.io.cogeo import COGReader + +# now +from rio_tiler.io import Reader +from rio_tiler.io.rasterio import Reader +``` + +Note: We kept a `rio_tiler.io.COGReader` alias to `Reader` for compatibility. + +## rio_tiler.io.cogeo -> rio_tiler.io.**rasterio** + +The readers' submodules now reflect the backend they use (rasterio, xarray, stac, ...)
+ +```python +# before +from rio_tiler.io.cogeo import COGReader + +# now +from rio_tiler.io.rasterio import Reader +``` + +## **Band names** + +Band names are now prefixed with `b` (e.g `b1`, `b2`) + +```python +# before +with COGReader( + "http://oin-hotosm.s3.amazonaws.com/5a95f32c2553e6000ce5ad2e/0/10edab38-1bdd-4c06-b83d-6e10ac532b7d.tif" +) as src: + stats = src.statistics() + print(list(stats)) + >>> ["1", "2", "3"] + + info = src.info() + print(info.band_metadata) + >>> [("1", {}), ("2", {}), ("3", {})] + + print(info.band_descriptions) + >>> [("1", ""), ("2", ""), ("3", "")] + +# now +with Reader( + "http://oin-hotosm.s3.amazonaws.com/5a95f32c2553e6000ce5ad2e/0/10edab38-1bdd-4c06-b83d-6e10ac532b7d.tif" +) as src: + stats = src.statistics() + print(list(stats)) + >>> ["b1", "b2", "b3"] + + info = src.info() + print(info.band_metadata) + >>> [("b1", {}), ("b2", {}), ("b3", {})] + + print(info.band_descriptions) + >>> [("b1", ""), ("b2", ""), ("b3", "")] +``` + +## MultiBaseReader **Expressions** + +We updated the `expression` format for `MultiBaseReader` (e.g STAC) to include **band names** and not only the asset name + +```python +# before +with STACReader("stac.json") as stac: + stac.tile(701, 102, 8, expression="green/red") + +# now +with STACReader("stac.json") as stac: + stac.tile(701, 102, 8, expression="green_b1/red_b1") +``` + +In addition we also removed `asset_expression` option in `MultiBaseReader`. This can be achieved directly using expression. 
+ +```python +# before +with STACReader(stac_url, exclude_assets={"thumbnail"},) as stac: + img = stac.tile( + 145, + 103, + 8, + tilesize=256, + assets=["B01", "B02"], + asset_expression={ + "B01": "b1+500", # add 500 to the first band + "B02": "b1-100", # subtract 100 from the first band + } + ) + +# now +with STACReader(stac_url, exclude_assets={"thumbnail"},) as stac: + img = stac.tile( + 145, + 103, + 8, + tilesize=256, + expression="B01_b1+500;B02_b1-100", + ) +``` + +## No more GCPCOGReader + +`rio_tiler.io.Reader` will now recognize if the file has internal GCPs. + +```python +# before +from rio_tiler.io import GCPCOGReader + +with GCPCOGReader("my_tif_with_gcps.tif") as src: + pass + +# now +from rio_tiler.io import Reader + +with Reader("my_tif_with_gcps.tif") as src: + pass +``` + +## **PointData** object + +Like the methods returning images, methods returning point values (`Reader.point()`) now return a `PointData` object. + +```python +# before +with COGReader("cog.tif") as cog: + print(cog.point(10.20, -42.0)) + >>> [0, 0, 0] + +# now +with Reader("cog.tif") as cog: + print(cog.point(10.20, -42.0)) + >>> PointData( + data=array([3744], dtype=uint16), + mask=array([255], dtype=uint8), + band_names=['b1'], + coordinates=(10.20, -42), + crs=CRS.from_epsg(4326), + assets=['cog.tif'], + metadata={} + ) +``` + +## Low-level reader methods return ImageData and PointData objects + +`rio_tiler.reader.read` and `rio_tiler.reader.part` now return an `ImageData` object instead of `Tuple[ndarray, ndarray]`.
+ +```python +from rio_tiler.reader import read, part, point +from rio_tiler.models import ImageData, PointData + +# before +with rasterio.open("image.tif") as src: + data, mask = read(src) + pts = point(10.20, -42.0) + print(pts) + >>> [0, 0, 0] + +# now +with rasterio.open("image.tif") as src: + img = read(src) + assert isinstance(img, ImageData) + + pts = point(src, (10.20, -42.0)) + assert isinstance(pts, PointData) + print(pts) + >>> PointData( + data=array([3744], dtype=uint16), + mask=array([255], dtype=uint8), + band_names=['b1'], + coordinates=(10.20, -42), + crs=CRS.from_epsg(4326), + assets=['cog.tif'], + metadata={} + ) +``` + +## **Reader** options + +We removed `nodata`, `unscale`, `resampling_method`, `vrt_options` and `post_process` options to `rio_tiler.io.Reader` init method and replaced with a global `options`: +```python +# before +with COGReader("cog.tif", nodata=1, resampling_method="bilinear") as cog: + data = cog.preview() + +# now +with Reader(COGEO, options={"nodata": 1, "resampling_method": "bilinear"}) as cog: + data = cog.preview() +``` + +## Base classes **minzoom** and **maxzoom** + +We moved min/max zoom attribute from the `SpatialMixin` to the base classes definition directly. This means that each class should now take care of the definition of those two variables. + +```python +# before +@attr.s +class BandFileReader(MultiBandReader): + """Test MultiBand""" + + input: str = attr.ib() + tms: morecantile.TileMatrixSet = attr.ib(default=WEB_MERCATOR_TMS) + + reader: Type[BaseReader] = attr.ib(init=False, default=Reader) + reader_options: Dict = attr.ib(factory=dict) + + def __attrs_post_init__(self): + ... 
+ +# now +@attr.s +class BandFileReader(MultiBandReader): + """Test MultiBand""" + + input: str = attr.ib() + tms: morecantile.TileMatrixSet = attr.ib(default=WEB_MERCATOR_TMS) + + reader: Type[BaseReader] = attr.ib(init=False, default=Reader) + reader_options: Dict = attr.ib(factory=dict) + + minzoom: int = attr.ib() + maxzoom: int = attr.ib() + + @minzoom.default + def _minzoom(self): + return self.tms.minzoom + + @maxzoom.default + def _maxzoom(self): + return self.tms.maxzoom + + def __attrs_post_init__(self): + ... +``` + +# New Features + +## Non-Geo reader + +Because not all rasters are geo-referenced, we added `rio_tiler.io.ImageReader` to allow opening and reading non-geo images. All methods return data in the pixel coordinate system. + +```python +with ImageReader("image.jpg") as src: + info = src.info() + + stats = src.statistics() + + # Part of the image (Origin is top-left, coordinates should be in form of (left, bottom, right, top)) + im = src.part((0, 100, 100, 0)) + + # 256x256 Tile (Origin of the TMS is top-left) + im = src.tile(0, 0, src.maxzoom) + + # read pixel x=10, y=5 (Origin is top-left) + pt = src.point(10, 5) +``` + +## Xarray reader + +We added an *optional* xarray compatible reader in rio-tiler v4.0. The reader takes an `xarray.DataArray` as input, which should have a CRS and geo-spatial variables (x,y or longitude,latitude).
+ +```python +import rioxarray +import xarray +from rio_tiler.io import XarrayReader + +with xarray.open_dataset( + "https://ncsa.osn.xsede.org/Pangeo/pangeo-forge/noaa-coastwatch-geopolar-sst-feedstock/noaa-coastwatch-geopolar-sst.zarr", + engine="zarr", + decode_coords="all" +) as src: + ds = src["analysed_sst"][:1] + # the SST dataset does not have CRS info + # so we need to add it `virtually` within the Xarray DataArray + ds.rio.write_crs("epsg:4326", inplace=True) + + with XarrayReader(ds) as dst: + print(dst.info()) + img = dst.tile(1, 1, 2) +``` + +Note: Users might experience some really bad performance depending on the chunking of the original zarr. + +## Dataset Statistics + +Starting with rio-tiler 4.0, if the input dataset has [`statistics`](https://gdal.org/user/raster_data_model.html#raster-band) (e.g `STATISTICS_MINIMUM`, `STATISTICS_MAXIMUM`) within its metadata, rio-tiler will try to use them to automatically rescale the output image. + +```python +from rio_tiler.io import Reader + +with Reader("https://data.geo.admin.ch/ch.swisstopo.swissalti3d/swissalti3d_2019_2573-1085/swissalti3d_2019_2573-1085_0.5_2056_5728.tif") as src: + info = src.info() + print(info.band_metadata) + >>> [('b1', + {'STATISTICS_COVARIANCES': '10685.98787505646', + 'STATISTICS_EXCLUDEDVALUES': '-9999', + 'STATISTICS_MAXIMUM': '2015.0944824219', + 'STATISTICS_MEAN': '1754.471184271', + 'STATISTICS_MINIMUM': '1615.8128662109', + 'STATISTICS_SKIPFACTORX': '1', + 'STATISTICS_SKIPFACTORY': '1', + 'STATISTICS_STDDEV': '103.37305197708'})] + + img = src.preview() + # The min/max statistics are saved within every output image object + print(img.dataset_statistics) + >>> [(1615.8128662109, 2015.0944824219)] + + buffer = img.render() + >>> rio-tiler/rio_tiler/models.py:516: InvalidDatatypeWarning: Invalid type: `float32` for the `PNG` driver. Data will be rescaled using min/max type bounds or dataset_statistics.
+``` diff --git a/pyproject.toml b/pyproject.toml index 66740332..1522029e 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -2,7 +2,7 @@ name = "rio-tiler" description = "User friendly Rasterio plugin to read raster datasets." readme = "README.md" -requires-python = ">=3.7" +requires-python = ">=3.8" license = {file = "LICENSE"} authors = [ {name = "Vincent Sarago", email = "vincent@developmentseed.com"}, @@ -12,9 +12,9 @@ classifiers = [ "Intended Audience :: Information Technology", "Intended Audience :: Science/Research", "License :: OSI Approved :: BSD License", - "Programming Language :: Python :: 3.7", "Programming Language :: Python :: 3.8", "Programming Language :: Python :: 3.9", + "Programming Language :: Python :: 3.10", "Topic :: Scientific/Engineering :: GIS", ] dynamic = ["version"] @@ -28,7 +28,7 @@ dependencies = [ "morecantile>=3.1,<4.0", "pydantic", "pystac>=0.5.4", - "rasterio>=1.1.7", + "rasterio>=1.3.0", "rio-color", "importlib_resources>=1.1.0; python_version < '3.9'", ] @@ -39,10 +39,18 @@ test = [ "pytest-asyncio", "pytest-benchmark", "pytest-cov", + + # XarrayReader + "xarray", + "rioxarray", ] dev = [ "pre-commit", ] +xarray = [ + "xarray", + "rioxarray", +] docs = [ "nbconvert", "mkdocs", diff --git a/rio_tiler/colormap.py b/rio_tiler/colormap.py index 0d3900f6..4e6afc5e 100644 --- a/rio_tiler/colormap.py +++ b/rio_tiler/colormap.py @@ -8,13 +8,18 @@ import attr import numpy -from .errors import ( +from rio_tiler.errors import ( ColorMapAlreadyRegistered, InvalidColorFormat, InvalidColorMapName, InvalidFormat, ) -from .types import ColorMapType, DataMaskType, GDALColorMapType, IntervalColorMapType +from rio_tiler.types import ( + ColorMapType, + DataMaskType, + GDALColorMapType, + IntervalColorMapType, +) try: from importlib.resources import files as resources_files # type: ignore diff --git a/rio_tiler/constants.py b/rio_tiler/constants.py index 78cebc3e..e96430a9 100644 --- a/rio_tiler/constants.py +++ b/rio_tiler/constants.py @@ 
-6,7 +6,7 @@ import morecantile from rasterio.crs import CRS -from .types import BBox, ColorTuple, Indexes, NoData, NumType # noqa +from rio_tiler.types import BBox, ColorTuple, Indexes, NoData, NumType # noqa MAX_THREADS = int( os.environ.get("RIO_TILER_MAX_THREADS", multiprocessing.cpu_count() * 5) diff --git a/rio_tiler/errors.py b/rio_tiler/errors.py index f51bb027..326a66b2 100644 --- a/rio_tiler/errors.py +++ b/rio_tiler/errors.py @@ -13,8 +13,8 @@ class TileOutsideBounds(RioTilerError): """Z-X-Y Tile is outside image bounds.""" -class IncorrectTileBuffer(RioTilerError): - """Tile buffer is a float but not half of an integer""" +class InvalidBufferSize(RioTilerError): + "`buffer` must be a multiple of `0.5` (e.g: 0.5, 1, 1.5, ...)." class PointOutsideBounds(RioTilerError): diff --git a/rio_tiler/expression.py b/rio_tiler/expression.py index 7b33c868..d733be08 100644 --- a/rio_tiler/expression.py +++ b/rio_tiler/expression.py @@ -2,7 +2,7 @@ import re import warnings -from typing import List, Sequence, Tuple, Union +from typing import List, Sequence, Tuple import numexpr import numpy @@ -59,7 +59,7 @@ def get_expression_blocks(expression: str) -> List[str]: def apply_expression( blocks: Sequence[str], - bands: Sequence[Union[str, int]], + bands: Sequence[str], data: numpy.ndarray, ) -> numpy.ndarray: """Apply rio-tiler expression. @@ -74,6 +74,11 @@ def apply_expression( numpy.array: output data. 
""" + if len(bands) != data.shape[0]: + raise ValueError( + f"Incompatible number of bands ({bands}) and data shape {data.shape}" + ) + return numpy.array( [ numpy.nan_to_num( diff --git a/rio_tiler/io/__init__.py b/rio_tiler/io/__init__.py index 2ccea3ad..43b6c801 100644 --- a/rio_tiler/io/__init__.py +++ b/rio_tiler/io/__init__.py @@ -1,5 +1,9 @@ """rio-tiler.io""" -from .base import AsyncBaseReader, BaseReader, MultiBandReader, MultiBaseReader # noqa -from .cogeo import COGReader, GCPCOGReader # noqa +from .base import BaseReader, MultiBandReader, MultiBaseReader # noqa +from .rasterio import ImageReader, Reader # noqa from .stac import STACReader # noqa +from .xarray import XarrayReader # noqa + +# Keep Compatibility with <4.0 +COGReader = Reader diff --git a/rio_tiler/io/base.py b/rio_tiler/io/base.py index 37fdf2f6..966322fb 100644 --- a/rio_tiler/io/base.py +++ b/rio_tiler/io/base.py @@ -3,7 +3,7 @@ import abc import re import warnings -from typing import Any, Coroutine, Dict, List, Optional, Sequence, Tuple, Type, Union +from typing import Any, Dict, List, Optional, Sequence, Tuple, Type, Union import attr import numpy @@ -11,18 +11,24 @@ from rasterio.crs import CRS from rasterio.warp import transform_bounds -from ..constants import WEB_MERCATOR_TMS, WGS84_CRS -from ..errors import ( +from rio_tiler.constants import WEB_MERCATOR_TMS, WGS84_CRS +from rio_tiler.errors import ( ExpressionMixingWarning, MissingAssets, MissingBands, TileOutsideBounds, ) -from ..expression import apply_expression, get_expression_blocks -from ..models import BandStatistics, ImageData, Info -from ..tasks import multi_arrays, multi_values -from ..types import BBox, Indexes -from ..utils import get_array_statistics +from rio_tiler.models import BandStatistics, ImageData, Info, PointData +from rio_tiler.tasks import multi_arrays, multi_points, multi_values +from rio_tiler.types import BBox, Indexes +from rio_tiler.utils import get_array_statistics, normalize_bounds + + +def 
_AssetExpressionWarning(): + warnings.warn( + "asset_expression is deprecated and will be removed in 4.0. Use pure Expression", + DeprecationWarning, + ) @attr.s @@ -31,19 +37,11 @@ class SpatialMixin: Attributes: tms (morecantile.TileMatrixSet, optional): TileMatrixSet grid definition. Defaults to `WebMercatorQuad`. - minzoom (int): Dataset Min Zoom level. **Not in __init__**. - maxzoom (int): Dataset Max Zoom level. **Not in __init__**. - bounds (tuple): Dataset bounds (left, bottom, right, top). **Not in __init__**. - crs (rasterio.crs.CRS): Dataset crs. **Not in __init__**. - geographic_crs (rasterio.crs.CRS): CRS to use as geographic coordinate system. Defaults to WGS84. **Not in __init__**. """ tms: TileMatrixSet = attr.ib(default=WEB_MERCATOR_TMS) - minzoom: int = attr.ib(init=False) - maxzoom: int = attr.ib(init=False) - bounds: BBox = attr.ib(init=False) crs: CRS = attr.ib(init=False) @@ -51,7 +49,7 @@ class SpatialMixin: @property def geographic_bounds(self) -> BBox: - """return bounds in WGS84.""" + """Return dataset bounds in geographic_crs.""" if self.crs == self.geographic_crs: return self.bounds @@ -64,7 +62,7 @@ def geographic_bounds(self) -> BBox: ) except: # noqa warnings.warn( - "Cannot dertermine bounds in geographic CRS, will default to (-180.0, -90.0, 180.0, 90.0).", + "Cannot determine bounds in geographic CRS, will default to (-180.0, -90.0, 180.0, 90.0).", UserWarning, ) bounds = (-180.0, -90, 180.0, 90) @@ -117,17 +115,26 @@ def tile_exists(self, tile_x: int, tile_y: int, tile_z: int) -> bool: if not all(numpy.isfinite(tile_bounds)): return True + tile_bounds = normalize_bounds(tile_bounds) + dst_bounds = normalize_bounds(self.bounds) + return ( - (tile_bounds[0] < self.bounds[2]) - and (tile_bounds[2] > self.bounds[0]) - and (tile_bounds[3] > self.bounds[1]) - and (tile_bounds[1] < self.bounds[3]) + (tile_bounds[0] < dst_bounds[2]) + and (tile_bounds[2] > dst_bounds[0]) + and (tile_bounds[3] > dst_bounds[1]) + and (tile_bounds[1] < 
dst_bounds[3]) ) @attr.s class BaseReader(SpatialMixin, metaclass=abc.ABCMeta): - """Rio-tiler.io BaseReader.""" + """Rio-tiler.io BaseReader. + + Attributes: + input (any): Reader's input. + tms (morecantile.TileMatrixSet, optional): TileMatrixSet grid definition. Defaults to `WebMercatorQuad`. + + """ input: Any = attr.ib() tms: TileMatrixSet = attr.ib(default=WEB_MERCATOR_TMS) @@ -151,111 +158,7 @@ def info(self) -> Info: ... @abc.abstractmethod - def statistics(self, **kwargs: Any) -> Dict[str, BandStatistics]: - """Return bands statistics from a dataset. - - Returns: - Dict[str, rio_tiler.models.BandStatistics]: bands statistics. - - """ - ... - - @abc.abstractmethod - def tile(self, tile_x: int, tile_y: int, tile_z: int, **kwargs: Any) -> ImageData: - """Read a Map tile from the Dataset. - - Args: - tile_x (int): Tile's horizontal index. - tile_y (int): Tile's vertical index. - tile_z (int): Tile's zoom level index. - - Returns: - rio_tiler.models.ImageData: ImageData instance with data, mask and tile spatial info. - - """ - ... - - @abc.abstractmethod - def part(self, bbox: BBox, **kwargs: Any) -> ImageData: - """Read a Part of a Dataset. - - Args: - bbox (tuple): Output bounds (left, bottom, right, top) in target crs. - - Returns: - rio_tiler.models.ImageData: ImageData instance with data, mask and input spatial info. - - """ - ... - - @abc.abstractmethod - def preview(self, **kwargs: Any) -> ImageData: - """Read a preview of a Dataset. - - Returns: - rio_tiler.models.ImageData: ImageData instance with data, mask and input spatial info. - - """ - ... - - @abc.abstractmethod - def point(self, lon: float, lat: float, **kwargs: Any) -> List: - """Read a value from a Dataset. - - Args: - lon (float): Longitude. - lat (float): Latitude. - - Returns: - list: Pixel value per bands/assets. - - """ - ... - - @abc.abstractmethod - def feature(self, shape: Dict, **kwargs: Any) -> ImageData: - """Read a Dataset for a GeoJSON feature. 
- - Args: - shape (dict): Valid GeoJSON feature. - - Returns: - rio_tiler.models.ImageData: ImageData instance with data, mask and input spatial info. - - """ - ... - - -@attr.s -class AsyncBaseReader(SpatialMixin, metaclass=abc.ABCMeta): - """Rio-tiler.io AsyncBaseReader.""" - - input: Any = attr.ib() - tms: TileMatrixSet = attr.ib(default=WEB_MERCATOR_TMS) - - async def __aenter__(self): - """Support using with Context Managers.""" - return self - - async def __aexit__(self, exc_type, exc_value, traceback): - """Support using with Context Managers.""" - pass - - @abc.abstractmethod - async def info(self) -> Coroutine[Any, Any, Info]: - """Return Dataset's info. - - Returns: - rio_tile.models.Info: Dataset info. - - """ - ... - - @abc.abstractmethod - async def statistics( - self, - **kwargs: Any, - ) -> Coroutine[Any, Any, Dict[str, BandStatistics]]: + def statistics(self) -> Dict[str, BandStatistics]: """Return bands statistics from a dataset. Returns: @@ -265,9 +168,7 @@ async def statistics( ... @abc.abstractmethod - async def tile( - self, tile_x: int, tile_y: int, tile_z: int, **kwargs: Any - ) -> Coroutine[Any, Any, ImageData]: + def tile(self, tile_x: int, tile_y: int, tile_z: int) -> ImageData: """Read a Map tile from the Dataset. Args: @@ -282,7 +183,7 @@ async def tile( ... @abc.abstractmethod - async def part(self, bbox: BBox, **kwargs: Any) -> Coroutine[Any, Any, ImageData]: + def part(self, bbox: BBox) -> ImageData: """Read a Part of a Dataset. Args: @@ -295,7 +196,7 @@ async def part(self, bbox: BBox, **kwargs: Any) -> Coroutine[Any, Any, ImageData ... @abc.abstractmethod - async def preview(self, **kwargs: Any) -> Coroutine[Any, Any, ImageData]: + def preview(self) -> ImageData: """Read a preview of a Dataset. Returns: @@ -305,9 +206,7 @@ async def preview(self, **kwargs: Any) -> Coroutine[Any, Any, ImageData]: ... 
@abc.abstractmethod - async def point( - self, lon: float, lat: float, **kwargs: Any - ) -> Coroutine[Any, Any, List]: + def point(self, lon: float, lat: float) -> PointData: """Read a value from a Dataset. Args: @@ -315,15 +214,13 @@ async def point( lat (float): Latitude. Returns: - list: Pixel value per bands/assets. + rio_tiler.models.PointData: PointData instance with data, mask and spatial info. """ ... @abc.abstractmethod - async def feature( - self, shape: Dict, **kwargs: Any - ) -> Coroutine[Any, Any, ImageData]: + def feature(self, shape: Dict) -> ImageData: """Read a Dataset for a GeoJSON feature. Args: @@ -345,17 +242,21 @@ class MultiBaseReader(SpatialMixin, metaclass=abc.ABCMeta): Attributes: input (any): input data. tms (morecantile.TileMatrixSet, optional): TileMatrixSet grid definition. Defaults to `WebMercatorQuad`. + minzoom (int, optional): Set dataset's minzoom. + maxzoom (int, optional): Set dataset's maxzoom. reader_options (dict, option): options to forward to the reader. Defaults to `{}`. - reader (rio_tiler.io.BaseReader): reader. **Not in __init__**. - assets (sequence): Asset list. **Not in __init__**. 
""" input: Any = attr.ib() tms: TileMatrixSet = attr.ib(default=WEB_MERCATOR_TMS) - reader_options: Dict = attr.ib(factory=dict) + + minzoom: int = attr.ib(default=None) + maxzoom: int = attr.ib(default=None) reader: Type[BaseReader] = attr.ib(init=False) + reader_options: Dict = attr.ib(factory=dict) + assets: Sequence[str] = attr.ib(init=False) def __enter__(self): @@ -373,11 +274,11 @@ def _get_asset_url(self, asset: str) -> str: def parse_expression(self, expression: str) -> Tuple: """Parse rio-tiler band math expression.""" - assets = "|".join([rf"\b{asset}\b" for asset in self.assets]) - _re = re.compile(assets.replace("\\\\", "\\")) + assets = "|".join(self.assets) + _re = re.compile(rf"\b({assets})_b\d+\b") return tuple(set(re.findall(_re, expression))) - def info( # type: ignore + def info( self, assets: Union[Sequence[str], str] = None, **kwargs: Any ) -> Dict[str, Info]: """Return metadata from multiple assets. @@ -407,7 +308,7 @@ def _reader(asset: str, **kwargs: Any) -> Dict: return multi_values(assets, _reader, **kwargs) - def statistics( # type: ignore + def statistics( self, assets: Union[Sequence[str], str] = None, asset_indexes: Optional[Dict[str, Indexes]] = None, # Indexes for each asset @@ -452,7 +353,7 @@ def _reader(asset: str, *args, **kwargs) -> Dict: return multi_values(assets, _reader, **kwargs) - def merged_statistics( # type: ignore + def merged_statistics( self, assets: Union[Sequence[str], str] = None, expression: Optional[str] = None, @@ -471,7 +372,7 @@ def merged_statistics( # type: ignore assets (sequence of str or str): assets to fetch info from. expression (str, optional): rio-tiler expression for the asset list (e.g. asset1/asset2+asset3). asset_indexes (dict, optional): Band indexes for each asset (e.g {"asset1": 1, "asset2": (1, 2,)}). - asset_expression (dict, optional): rio-tiler expression for each asset (e.g. {"asset1": "b1/b2+b3", "asset2": ...}). 
+ asset_expression (dict, optional): rio-tiler expression for each asset (e.g. {"asset1": "b1/b2+b3", "asset2": ...}). **Deprecated** categorical (bool): treat input data as categorical data. Defaults to False. categories (list of numbers, optional): list of categories to return value for. percentiles (list of numbers, optional): list of percentile values to calculate. Defaults to `[2, 98]`. @@ -484,6 +385,9 @@ def merged_statistics( # type: ignore Dict[str, rio_tiler.models.BandStatistics]: bands statistics. """ + if asset_expression: + _AssetExpressionWarning() + if not expression: if not assets: warnings.warn( @@ -496,7 +400,6 @@ def merged_statistics( # type: ignore assets=assets, expression=expression, asset_indexes=asset_indexes, - asset_expression=asset_expression, max_size=max_size, **kwargs, ) @@ -536,13 +439,16 @@ def tile( assets (sequence of str or str, optional): assets to fetch info from. expression (str, optional): rio-tiler expression for the asset list (e.g. asset1/asset2+asset3). asset_indexes (dict, optional): Band indexes for each asset (e.g {"asset1": 1, "asset2": (1, 2,)}). - asset_expression (dict, optional): rio-tiler expression for each asset (e.g. {"asset1": "b1/b2+b3", "asset2": ...}). + asset_expression (dict, optional): rio-tiler expression for each asset (e.g. {"asset1": "b1/b2+b3", "asset2": ...}). **Deprecated** kwargs (optional): Options to forward to the `self.reader.tile` method. Returns: rio_tiler.models.ImageData: ImageData instance with data, mask and tile spatial info. 
""" + if asset_expression: + _AssetExpressionWarning() + if not self.tile_exists(tile_x, tile_y, tile_z): raise TileOutsideBounds( f"Tile {tile_z}/{tile_x}/{tile_y} is outside image bounds" @@ -566,35 +472,20 @@ def tile( ) asset_indexes = asset_indexes or {} - asset_expression = asset_expression or {} def _reader(asset: str, *args: Any, **kwargs: Any) -> ImageData: url = self._get_asset_url(asset) + idx = asset_indexes.get(asset) or kwargs.pop("indexes", None) # type: ignore with self.reader(url, tms=self.tms, **self.reader_options) as cog: # type: ignore - data = cog.tile( - *args, - indexes=asset_indexes.get(asset, kwargs.pop("indexes", None)), # type: ignore - expression=asset_expression.get(asset), # type: ignore - **kwargs, - ) + data = cog.tile(*args, indexes=idx, **kwargs) data.band_names = [f"{asset}_{n}" for n in data.band_names] return data - output = multi_arrays( - assets, - _reader, - tile_x, - tile_y, - tile_z, - **kwargs, - ) - + img = multi_arrays(assets, _reader, tile_x, tile_y, tile_z, **kwargs) if expression: - blocks = get_expression_blocks(expression) - output.data = apply_expression(blocks, assets, output.data) - output.band_names = blocks + return img.apply_expression(expression) - return output + return img def part( self, @@ -612,13 +503,16 @@ def part( assets (sequence of str or str, optional): assets to fetch info from. expression (str, optional): rio-tiler expression for the asset list (e.g. asset1/asset2+asset3). asset_indexes (dict, optional): Band indexes for each asset (e.g {"asset1": 1, "asset2": (1, 2,)}). - asset_expression (dict, optional): rio-tiler expression for each asset (e.g. {"asset1": "b1/b2+b3", "asset2": ...}). + asset_expression (dict, optional): rio-tiler expression for each asset (e.g. {"asset1": "b1/b2+b3", "asset2": ...}). **Deprecated** kwargs (optional): Options to forward to the `self.reader.part` method. Returns: rio_tiler.models.ImageData: ImageData instance with data, mask and tile spatial info. 
""" + if asset_expression: + _AssetExpressionWarning() + if isinstance(assets, str): assets = (assets,) @@ -637,28 +531,20 @@ def part( ) asset_indexes = asset_indexes or {} - asset_expression = asset_expression or {} def _reader(asset: str, *args: Any, **kwargs: Any) -> ImageData: url = self._get_asset_url(asset) + idx = asset_indexes.get(asset) or kwargs.pop("indexes", None) # type: ignore with self.reader(url, tms=self.tms, **self.reader_options) as cog: # type: ignore - data = cog.part( - *args, - indexes=asset_indexes.get(asset, kwargs.pop("indexes", None)), # type: ignore - expression=asset_expression.get(asset), # type: ignore - **kwargs, - ) + data = cog.part(*args, indexes=idx, **kwargs) data.band_names = [f"{asset}_{n}" for n in data.band_names] return data - output = multi_arrays(assets, _reader, bbox, **kwargs) - + img = multi_arrays(assets, _reader, bbox, **kwargs) if expression: - blocks = get_expression_blocks(expression) - output.data = apply_expression(blocks, assets, output.data) - output.band_names = blocks + return img.apply_expression(expression) - return output + return img def preview( self, @@ -674,13 +560,16 @@ def preview( assets (sequence of str or str, optional): assets to fetch info from. expression (str, optional): rio-tiler expression for the asset list (e.g. asset1/asset2+asset3). asset_indexes (dict, optional): Band indexes for each asset (e.g {"asset1": 1, "asset2": (1, 2,)}). - asset_expression (dict, optional): rio-tiler expression for each asset (e.g. {"asset1": "b1/b2+b3", "asset2": ...}). + asset_expression (dict, optional): rio-tiler expression for each asset (e.g. {"asset1": "b1/b2+b3", "asset2": ...}). **Deprecated** kwargs (optional): Options to forward to the `self.reader.preview` method. Returns: rio_tiler.models.ImageData: ImageData instance with data, mask and tile spatial info. 
""" + if asset_expression: + _AssetExpressionWarning() + if isinstance(assets, str): assets = (assets,) @@ -699,27 +588,20 @@ def preview( ) asset_indexes = asset_indexes or {} - asset_expression = asset_expression or {} def _reader(asset: str, **kwargs: Any) -> ImageData: url = self._get_asset_url(asset) + idx = asset_indexes.get(asset) or kwargs.pop("indexes", None) # type: ignore with self.reader(url, tms=self.tms, **self.reader_options) as cog: # type: ignore - data = cog.preview( - indexes=asset_indexes.get(asset, kwargs.pop("indexes", None)), # type: ignore - expression=asset_expression.get(asset), # type: ignore - **kwargs, - ) + data = cog.preview(indexes=idx, **kwargs) data.band_names = [f"{asset}_{n}" for n in data.band_names] return data - output = multi_arrays(assets, _reader, **kwargs) - + img = multi_arrays(assets, _reader, **kwargs) if expression: - blocks = get_expression_blocks(expression) - output.data = apply_expression(blocks, assets, output.data) - output.band_names = blocks + return img.apply_expression(expression) - return output + return img def point( self, @@ -730,7 +612,7 @@ def point( asset_indexes: Optional[Dict[str, Indexes]] = None, # Indexes for each asset asset_expression: Optional[Dict[str, str]] = None, # Expression for each asset **kwargs: Any, - ) -> List: + ) -> PointData: """Read pixel value from multiple assets. Args: @@ -739,13 +621,16 @@ def point( assets (sequence of str or str, optional): assets to fetch info from. expression (str, optional): rio-tiler expression for the asset list (e.g. asset1/asset2+asset3). asset_indexes (dict, optional): Band indexes for each asset (e.g {"asset1": 1, "asset2": (1, 2,)}). - asset_expression (dict, optional): rio-tiler expression for each asset (e.g. {"asset1": "b1/b2+b3", "asset2": ...}). + asset_expression (dict, optional): rio-tiler expression for each asset (e.g. {"asset1": "b1/b2+b3", "asset2": ...}). 
**Deprecated** kwargs (optional): Options to forward to the `self.reader.point` method. Returns: - list: Pixel values per assets. + PointData """ + if asset_expression: + _AssetExpressionWarning() + if isinstance(assets, str): assets = (assets,) @@ -764,26 +649,20 @@ def point( ) asset_indexes = asset_indexes or {} - asset_expression = asset_expression or {} - def _reader(asset: str, *args, **kwargs: Any) -> Dict: + def _reader(asset: str, *args, **kwargs: Any) -> PointData: url = self._get_asset_url(asset) + idx = asset_indexes.get(asset) or kwargs.pop("indexes", None) # type: ignore with self.reader(url, tms=self.tms, **self.reader_options) as cog: # type: ignore - return cog.point( - *args, - indexes=asset_indexes.get(asset, kwargs.pop("indexes", None)), # type: ignore - expression=asset_expression.get(asset), # type: ignore - **kwargs, - ) - - data = multi_values(assets, _reader, lon, lat, **kwargs) + data = cog.point(*args, indexes=idx, **kwargs) + data.band_names = [f"{asset}_{n}" for n in data.band_names] + return data - values = [numpy.array(d) for _, d in data.items()] + data = multi_points(assets, _reader, lon, lat, **kwargs) if expression: - blocks = get_expression_blocks(expression) - values = apply_expression(blocks, assets, values) + return data.apply_expression(expression) - return [v.tolist() for v in values] + return data def feature( self, @@ -801,13 +680,16 @@ def feature( assets (sequence of str or str, optional): assets to fetch info from. expression (str, optional): rio-tiler expression for the asset list (e.g. asset1/asset2+asset3). asset_indexes (dict, optional): Band indexes for each asset (e.g {"asset1": 1, "asset2": (1, 2,)}). - asset_expression (dict, optional): rio-tiler expression for each asset (e.g. {"asset1": "b1/b2+b3", "asset2": ...}). + asset_expression (dict, optional): rio-tiler expression for each asset (e.g. {"asset1": "b1/b2+b3", "asset2": ...}). 
**Deprecated** kwargs (optional): Options to forward to the `self.reader.feature` method. Returns: rio_tiler.models.ImageData: ImageData instance with data, mask and tile spatial info. """ + if asset_expression: + _AssetExpressionWarning() + if isinstance(assets, str): assets = (assets,) @@ -826,28 +708,20 @@ def feature( ) asset_indexes = asset_indexes or {} - asset_expression = asset_expression or {} def _reader(asset: str, *args: Any, **kwargs: Any) -> ImageData: url = self._get_asset_url(asset) + idx = asset_indexes.get(asset) or kwargs.pop("indexes", None) # type: ignore with self.reader(url, tms=self.tms, **self.reader_options) as cog: # type: ignore - data = cog.feature( - *args, - indexes=asset_indexes.get(asset, kwargs.pop("indexes", None)), # type: ignore - expression=asset_expression.get(asset), # type: ignore - **kwargs, - ) + data = cog.feature(*args, indexes=idx, **kwargs) data.band_names = [f"{asset}_{n}" for n in data.band_names] return data - output = multi_arrays(assets, _reader, shape, **kwargs) - + img = multi_arrays(assets, _reader, shape, **kwargs) if expression: - blocks = get_expression_blocks(expression) - output.data = apply_expression(blocks, assets, output.data) - output.band_names = blocks + return img.apply_expression(expression) - return output + return img @attr.s @@ -859,17 +733,21 @@ class MultiBandReader(SpatialMixin, metaclass=abc.ABCMeta): Attributes: input (any): input data. tms (morecantile.TileMatrixSet, optional): TileMatrixSet grid definition. Defaults to `WebMercatorQuad`. + minzoom (int, optional): Set dataset's minzoom. + maxzoom (int, optional): Set dataset's maxzoom. reader_options (dict, option): options to forward to the reader. Defaults to `{}`. - reader (rio_tiler.io.BaseReader): reader. **Not in __init__**. - bands (sequence): Band list. **Not in __init__**. 
""" input: Any = attr.ib() tms: TileMatrixSet = attr.ib(default=WEB_MERCATOR_TMS) - reader_options: Dict = attr.ib(factory=dict) + + minzoom: int = attr.ib(default=None) + maxzoom: int = attr.ib(default=None) reader: Type[BaseReader] = attr.ib(init=False) + reader_options: Dict = attr.ib(factory=dict) + bands: Sequence[str] = attr.ib(init=False) def __enter__(self): @@ -1049,17 +927,15 @@ def _reader(band: str, *args: Any, **kwargs: Any) -> ImageData: url = self._get_band_url(band) with self.reader(url, tms=self.tms, **self.reader_options) as cog: # type: ignore data = cog.tile(*args, **kwargs) - data.band_names = [band] + data.band_names = [band] # use `band` as name instead of band index return data - output = multi_arrays(bands, _reader, tile_x, tile_y, tile_z, **kwargs) + img = multi_arrays(bands, _reader, tile_x, tile_y, tile_z, **kwargs) if expression: - blocks = get_expression_blocks(expression) - output.data = apply_expression(blocks, bands, output.data) - output.band_names = blocks + return img.apply_expression(expression) - return output + return img def part( self, @@ -1101,17 +977,15 @@ def _reader(band: str, *args: Any, **kwargs: Any) -> ImageData: url = self._get_band_url(band) with self.reader(url, tms=self.tms, **self.reader_options) as cog: # type: ignore data = cog.part(*args, **kwargs) - data.band_names = [band] + data.band_names = [band] # use `band` as name instead of band index return data - output = multi_arrays(bands, _reader, bbox, **kwargs) + img = multi_arrays(bands, _reader, bbox, **kwargs) if expression: - blocks = get_expression_blocks(expression) - output.data = apply_expression(blocks, bands, output.data) - output.band_names = blocks + return img.apply_expression(expression) - return output + return img def preview( self, @@ -1151,17 +1025,15 @@ def _reader(band: str, **kwargs: Any) -> ImageData: url = self._get_band_url(band) with self.reader(url, tms=self.tms, **self.reader_options) as cog: # type: ignore data = 
cog.preview(**kwargs) - data.band_names = [band] + data.band_names = [band] # use `band` as name instead of band index return data - output = multi_arrays(bands, _reader, **kwargs) + img = multi_arrays(bands, _reader, **kwargs) if expression: - blocks = get_expression_blocks(expression) - output.data = apply_expression(blocks, bands, output.data) - output.band_names = blocks + return img.apply_expression(expression) - return output + return img def point( self, @@ -1170,7 +1042,7 @@ def point( bands: Union[Sequence[str], str] = None, expression: Optional[str] = None, **kwargs: Any, - ) -> List: + ) -> PointData: """Read a pixel values from multiple bands. Args: @@ -1181,7 +1053,7 @@ def point( kwargs (optional): Options to forward to the `self.reader.point` method. Returns: - list: Pixel value per bands. + PointData """ if isinstance(bands, str): @@ -1201,19 +1073,18 @@ def point( "bands must be passed either via expression or bands options." ) - def _reader(band: str, *args, **kwargs: Any) -> Dict: + def _reader(band: str, *args, **kwargs: Any) -> PointData: url = self._get_band_url(band) with self.reader(url, tms=self.tms, **self.reader_options) as cog: # type: ignore - return cog.point(*args, **kwargs)[0] # We only return the first value - - data = multi_values(bands, _reader, lon, lat, **kwargs) + data = cog.point(*args, **kwargs) + data.band_names = [band] # use `band` as name instead of band index + return data - values = [numpy.array(d) for _, d in data.items()] + data = multi_points(bands, _reader, lon, lat, **kwargs) if expression: - blocks = get_expression_blocks(expression) - values = apply_expression(blocks, bands, values) + return data.apply_expression(expression) - return [v.tolist() for v in values] + return data def feature( self, @@ -1255,14 +1126,12 @@ def _reader(band: str, *args: Any, **kwargs: Any) -> ImageData: url = self._get_band_url(band) with self.reader(url, tms=self.tms, **self.reader_options) as cog: # type: ignore data = 
cog.feature(*args, **kwargs) - data.band_names = [band] + data.band_names = [band] # use `band` as name instead of band index return data - output = multi_arrays(bands, _reader, shape, **kwargs) + img = multi_arrays(bands, _reader, shape, **kwargs) if expression: - blocks = get_expression_blocks(expression) - output.data = apply_expression(blocks, bands, output.data) - output.band_names = blocks + return img.apply_expression(expression) - return output + return img diff --git a/rio_tiler/io/cogeo.py b/rio_tiler/io/rasterio.py similarity index 51% rename from rio_tiler/io/cogeo.py rename to rio_tiler/io/rasterio.py index 6bd9aa07..214ff31e 100644 --- a/rio_tiler/io/cogeo.py +++ b/rio_tiler/io/rasterio.py @@ -1,79 +1,76 @@ -"""rio_tiler.io.cogeo: raster processing.""" +"""rio_tiler.io.rasterio: rio-tiler reader built on top Rasterio""" import contextlib import warnings -from typing import Any, Callable, Dict, List, Optional, Sequence, Tuple, Union +from typing import Any, Callable, Dict, List, Optional, Sequence, Union import attr import numpy import rasterio -from morecantile import BoundingBox, Tile, TileMatrixSet +from affine import Affine +from morecantile import BoundingBox, Coords, Tile, TileMatrixSet +from morecantile.utils import _parse_tile_arg from rasterio import transform from rasterio.crs import CRS from rasterio.enums import Resampling from rasterio.features import bounds as featureBounds +from rasterio.features import geometry_mask from rasterio.io import DatasetReader, DatasetWriter, MemoryFile from rasterio.rio.overview import get_maximum_overview_level +from rasterio.transform import from_bounds as transform_from_bounds from rasterio.vrt import WarpedVRT -from rasterio.warp import calculate_default_transform, transform_bounds +from rasterio.warp import calculate_default_transform +from rasterio.windows import Window +from rasterio.windows import from_bounds as window_from_bounds -from .. 
import reader -from ..constants import WEB_MERCATOR_TMS, WGS84_CRS -from ..errors import ( +from rio_tiler import reader +from rio_tiler.constants import WEB_MERCATOR_TMS, WGS84_CRS +from rio_tiler.errors import ( ExpressionMixingWarning, - IncorrectTileBuffer, NoOverviewWarning, + PointOutsideBounds, TileOutsideBounds, ) -from ..expression import apply_expression, get_expression_blocks, parse_expression -from ..models import BandStatistics, ImageData, Info -from ..types import BBox, DataMaskType, Indexes, NoData, NumType -from ..utils import ( +from rio_tiler.expression import parse_expression +from rio_tiler.io.base import BaseReader +from rio_tiler.models import BandStatistics, ImageData, Info, PointData +from rio_tiler.types import BBox, DataMaskType, Indexes, NumType +from rio_tiler.utils import ( create_cutline, get_array_statistics, - get_bands_names, has_alpha_band, has_mask_band, ) -from .base import BaseReader @attr.s -class COGReader(BaseReader): - """Cloud Optimized GeoTIFF Reader. +class Reader(BaseReader): + """Rasterio Reader. Attributes: - input (str): Cloud Optimized GeoTIFF path. + input (str): dataset path. dataset (rasterio.io.DatasetReader or rasterio.io.DatasetWriter or rasterio.vrt.WarpedVRT, optional): Rasterio dataset. - bounds (tuple): Dataset bounds (left, bottom, right, top). - crs (rasterio.crs.CRS): Dataset CRS. tms (morecantile.TileMatrixSet, optional): TileMatrixSet grid definition. Defaults to `WebMercatorQuad`. - minzoom (int, optional): Set minzoom for the tiles. - maxzoom (int, optional): Set maxzoom for the tiles. geographic_crs (rasterio.crs.CRS, optional): CRS to use as geographic coordinate system. Defaults to WGS84. colormap (dict, optional): Overwrite internal colormap. - nodata (int or float or str, optional): Global options, overwrite internal nodata value. - unscale (bool, optional): Global options, apply internal scale and offset on all read operations. 
- resampling_method (rasterio.enums.Resampling, optional): Global options, resampling method to use for read operations. - vrt_options (dict, optional): Global options, WarpedVRT options to use for read operations. - post_process (callable, optional): Global options, Function to apply after all read operations. + options (dict, optional): Options to forward to low-level reader methods. Examples: - >>> with COGReader(src_path) as cog: - cog.tile(...) + >>> with Reader(src_path) as src: + src.tile(...) >>> # Set global options - with COGReader(src_path, unscale=True, nodata=0) as cog: - cog.tile(...) + with Reader(src_path, options={"unscale": True, "nodata": 0}) as src: + src.tile(...) >>> with rasterio.open(src_path) as src_dst: with WarpedVRT(src_dst, ...) as vrt_dst: - with COGReader(None, dataset=vrt_dst) as cog: - cog.tile(...) + with Reader(None, dataset=vrt_dst) as src: + src.tile(...) >>> with rasterio.open(src_path) as src_dst: - with COGReader(None, dataset=src_dst) as cog: - cog.tile(...) + with Reader(None, dataset=src_dst) as src: + src.tile(...) """ @@ -83,42 +80,23 @@ class COGReader(BaseReader): ) tms: TileMatrixSet = attr.ib(default=WEB_MERCATOR_TMS) - minzoom: int = attr.ib(default=None) - maxzoom: int = attr.ib(default=None) - geographic_crs: CRS = attr.ib(default=WGS84_CRS) colormap: Dict = attr.ib(default=None) - # Define global options to be forwarded to functions reading the data (e.g `rio_tiler.reader.read`) - nodata: Optional[NoData] = attr.ib(default=None) - unscale: Optional[bool] = attr.ib(default=None) - resampling_method: Optional[Resampling] = attr.ib(default=None) - vrt_options: Optional[Dict] = attr.ib(default=None) - post_process: Optional[ - Callable[[numpy.ndarray, numpy.ndarray], DataMaskType] - ] = attr.ib(default=None) - - # We use _kwargs to store values of nodata, unscale, vrt_options and resampling_method. - # _kwargs is used avoid having to set those values on each method call. 
- _kwargs: Dict[str, Any] = attr.ib(init=False, factory=dict) + options: reader.Options = attr.ib() # Context Manager to handle rasterio open/close _ctx_stack = attr.ib(init=False, factory=contextlib.ExitStack) + _minzoom: int = attr.ib(init=False, default=None) + _maxzoom: int = attr.ib(init=False, default=None) + + @options.default + def _options_default(self): + return {} def __attrs_post_init__(self): """Define _kwargs, open dataset and get info.""" - if self.nodata is not None: - self._kwargs["nodata"] = self.nodata - if self.unscale is not None: - self._kwargs["unscale"] = self.unscale - if self.resampling_method is not None: - self._kwargs["resampling_method"] = self.resampling_method - if self.vrt_options is not None: - self._kwargs["vrt_options"] = self.vrt_options - if self.post_process is not None: - self._kwargs["post_process"] = self.post_process - if not self.dataset: dataset = self._ctx_stack.enter_context(rasterio.open(self.input)) if dataset.gcps[0]: @@ -135,11 +113,6 @@ def __attrs_post_init__(self): self.bounds = tuple(self.dataset.bounds) self.crs = self.dataset.crs - self.nodata = self.nodata if self.nodata is not None else self.dataset.nodata - - if self.minzoom is None or self.maxzoom is None: - self._set_zooms() - if self.colormap is None: self._get_colormap() @@ -159,11 +132,11 @@ def __exit__(self, exc_type, exc_value, traceback): """Support using with Context Managers.""" self.close() - def get_zooms(self, tilesize: int = 256) -> Tuple[int, int]: - """Calculate raster min/max zoom level for input TMS.""" - if self.dataset.crs != self.tms.rasterio_crs: + def _dst_geom_in_tms_crs(self): + """Return dataset info in TMS projection.""" + if self.crs != self.tms.rasterio_crs: dst_affine, w, h = calculate_default_transform( - self.dataset.crs, + self.crs, self.tms.rasterio_crs, self.dataset.width, self.dataset.height, @@ -174,33 +147,69 @@ def get_zooms(self, tilesize: int = 256) -> Tuple[int, int]: w = self.dataset.width h = self.dataset.height 
- # The maxzoom is defined by finding the minimum difference between - # the raster resolution and the zoom level resolution - resolution = max(abs(dst_affine[0]), abs(dst_affine[4])) - maxzoom = self.tms.zoom_for_res(resolution) + return dst_affine, w, h - # The minzoom is defined by the resolution of the maximum theoretical overview level - overview_level = get_maximum_overview_level(w, h, minsize=tilesize) - ovr_resolution = resolution * (2**overview_level) - minzoom = self.tms.zoom_for_res(ovr_resolution) + def get_minzoom(self) -> int: + """Define dataset minimum zoom level.""" + if self._minzoom is None: + # We assume the TMS tilesize to be constant over all matrices + # ref: https://github.com/OSGeo/gdal/blob/dc38aa64d779ecc45e3cd15b1817b83216cf96b8/gdal/frmts/gtiff/cogdriver.cpp#L274 + tilesize = self.tms.tileMatrix[0].tileWidth - return (minzoom, maxzoom) + try: + dst_affine, w, h = self._dst_geom_in_tms_crs() - def _set_zooms(self): - """Calculate raster min/max zoom level.""" - try: - minzoom, maxzoom = self.get_zooms() - except: # noqa - # if we can't get min/max zoom from the dataset we default to TMS min/max zoom - warnings.warn( - "Cannot dertermine min/max zoom based on dataset information, will default to TMS min/max zoom.", - UserWarning, - ) - minzoom, maxzoom = self.tms.minzoom, self.tms.maxzoom + # The minzoom is defined by the resolution of the maximum theoretical overview level + # We assume `tilesize`` is the smallest overview size + overview_level = get_maximum_overview_level(w, h, minsize=tilesize) + + # Get the resolution of the overview + resolution = max(abs(dst_affine[0]), abs(dst_affine[4])) + ovr_resolution = resolution * (2**overview_level) - self.minzoom = self.minzoom if self.minzoom is not None else minzoom - self.maxzoom = self.maxzoom if self.maxzoom is not None else maxzoom - return + # Find what TMS matrix match the overview resolution + self._minzoom = self.tms.zoom_for_res(ovr_resolution) + + except: # noqa + # if we can't 
get max zoom from the dataset we default to TMS maxzoom + warnings.warn( + "Cannot determine minzoom based on dataset information, will default to TMS minzoom.", + UserWarning, + ) + self._minzoom = self.tms.minzoom + + return self._minzoom + + def get_maxzoom(self) -> int: + """Define dataset maximum zoom level.""" + if self._maxzoom is None: + try: + dst_affine, _, _ = self._dst_geom_in_tms_crs() + + # The maxzoom is defined by finding the minimum difference between + # the raster resolution and the zoom level resolution + resolution = max(abs(dst_affine[0]), abs(dst_affine[4])) + self._maxzoom = self.tms.zoom_for_res(resolution) + + except: # noqa + # if we can't get min/max zoom from the dataset we default to TMS maxzoom + warnings.warn( + "Cannot determine maxzoom based on dataset information, will default to TMS maxzoom.", + UserWarning, + ) + self._maxzoom = self.tms.maxzoom + + return self._maxzoom + + @property + def minzoom(self): + """Return dataset minzoom.""" + return self.get_minzoom() + + @property + def maxzoom(self): + """Return dataset maxzoom.""" + return self.get_maxzoom() def _get_colormap(self): """Retrieve the internal colormap.""" @@ -217,12 +226,12 @@ def _get_descr(ix): """Return band description.""" return self.dataset.descriptions[ix - 1] or "" - if has_alpha_band(self.dataset): + if self.options.get("nodata", self.dataset.nodata) is not None: + nodata_type = "Nodata" + elif has_alpha_band(self.dataset): nodata_type = "Alpha" elif has_mask_band(self.dataset): nodata_type = "Mask" - elif self.nodata is not None: - nodata_type = "Nodata" else: nodata_type = "None" @@ -231,10 +240,10 @@ def _get_descr(ix): "minzoom": self.minzoom, "maxzoom": self.maxzoom, "band_metadata": [ - (f"{ix}", self.dataset.tags(ix)) for ix in self.dataset.indexes + (f"b{ix}", self.dataset.tags(ix)) for ix in self.dataset.indexes ], "band_descriptions": [ - (f"{ix}", _get_descr(ix)) for ix in self.dataset.indexes + (f"b{ix}", _get_descr(ix)) for ix in 
self.dataset.indexes ], "dtype": self.dataset.meta["dtype"], "colorinterp": [ @@ -257,7 +266,9 @@ def _get_descr(ix): meta.update({"colormap": self.colormap}) if nodata_type == "Nodata": - meta.update({"nodata_value": self.nodata}) + meta.update( + {"nodata_value": self.options.get("nodata", self.dataset.nodata)} + ) return Info(**meta) @@ -268,6 +279,8 @@ def statistics( percentiles: List[int] = [2, 98], hist_options: Optional[Dict] = None, max_size: int = 1024, + indexes: Optional[Indexes] = None, + expression: Optional[str] = None, **kwargs: Any, ) -> Dict[str, BandStatistics]: """Return bands statistics from a dataset. @@ -278,15 +291,17 @@ def statistics( percentiles (list of numbers, optional): list of percentile values to calculate. Defaults to `[2, 98]`. hist_options (dict, optional): Options to forward to numpy.histogram function. max_size (int, optional): Limit the size of the longest dimension of the dataset read, respecting bounds X/Y aspect ratio. Defaults to 1024. - kwargs (optional): Options to forward to `self.preview`. + kwargs (optional): Options to forward to `self.read`. Returns: Dict[str, rio_tiler.models.BandStatistics]: bands statistics. """ - kwargs = {**self._kwargs, **kwargs} + kwargs = {**self.options, **kwargs} - data = self.preview(max_size=max_size, **kwargs) + data = self.read( + max_size=max_size, indexes=indexes, expression=expression, **kwargs + ) hist_options = hist_options or {} @@ -312,6 +327,7 @@ def tile( indexes: Optional[Indexes] = None, expression: Optional[str] = None, tile_buffer: Optional[NumType] = None, + buffer: Optional[float] = None, **kwargs: Any, ) -> ImageData: """Read a Web Map tile from a COG. @@ -323,7 +339,8 @@ def tile( tilesize (int, optional): Output image size. Defaults to `256`. indexes (int or sequence of int, optional): Band indexes. expression (str, optional): rio-tiler expression (e.g. b1/b2+b3). - tile_buffer (int or float, optional): Buffer on each side of the given tile. 
It must be a multiple of `0.5`. Output **tilesize** will be expanded to `tilesize + 2 * tile_buffer` (e.g 0.5 = 257x257, 1.0 = 258x258). + tile_buffer (int or float, optional): Buffer on each side of the given tile. It must be a multiple of `0.5`. Output **tilesize** will be expanded to `tilesize + 2 * tile_buffer` (e.g 0.5 = 257x257, 1.0 = 258x258). DEPRECATED + buffer (float, optional): Buffer on each side of the given tile. It must be a multiple of `0.5`. Output **tilesize** will be expanded to `tilesize + 2 * tile_buffer` (e.g 0.5 = 257x257, 1.0 = 258x258). kwargs (optional): Options to forward to the `COGReader.part` method. Returns: @@ -336,25 +353,12 @@ def tile( ) tile_bounds = self.tms.xy_bounds(Tile(x=tile_x, y=tile_y, z=tile_z)) - if tile_buffer is not None: - if tile_buffer % 0.5: - raise IncorrectTileBuffer( - "`tile_buffer` must be a multiple of `0.5` (e.g: 0.5, 1, 1.5, ...)." - ) - x_res = (tile_bounds.right - tile_bounds.left) / tilesize - y_res = (tile_bounds.top - tile_bounds.bottom) / tilesize - - # Buffered Tile Bounds - tile_bounds = BoundingBox( - tile_bounds.left - x_res * tile_buffer, - tile_bounds.bottom - y_res * tile_buffer, - tile_bounds.right + x_res * tile_buffer, - tile_bounds.top + y_res * tile_buffer, + if tile_buffer: + warnings.warn( + "`tile_buffer` is deprecated, use `buffer`.", DeprecationWarning ) - - # Buffered Tile Size - tilesize += int(tile_buffer * 2) + buffer = tile_buffer return self.part( tile_bounds, @@ -365,6 +369,7 @@ def tile( max_size=None, indexes=indexes, expression=expression, + buffer=buffer, **kwargs, ) @@ -378,6 +383,7 @@ def part( max_size: Optional[int] = None, height: Optional[int] = None, width: Optional[int] = None, + buffer: Optional[float] = None, **kwargs: Any, ) -> ImageData: """Read part of a COG. @@ -391,16 +397,14 @@ def part( max_size (int, optional): Limit the size of the longest dimension of the dataset read, respecting bounds X/Y aspect ratio. 
height (int, optional): Output height of the array. width (int, optional): Output width of the array. + buffer (float, optional): Buffer on each side of the given aoi. It must be a multiple of `0.5`. Output **image size** will be expanded to `output imagesize + 2 * buffer` (e.g 0.5 = 257x257, 1.0 = 258x258). kwargs (optional): Options to forward to the `rio_tiler.reader.part` function. Returns: rio_tiler.models.ImageData: ImageData instance with data, mask and input spatial info. """ - kwargs = {**self._kwargs, **kwargs} - - if isinstance(indexes, int): - indexes = (indexes,) + kwargs = {**self.options, **kwargs} if indexes and expression: warnings.warn( @@ -414,7 +418,7 @@ def part( if not dst_crs: dst_crs = bounds_crs - data, mask = reader.part( + img = reader.part( self.dataset, bbox, max_size=max_size, @@ -423,27 +427,15 @@ def part( bounds_crs=bounds_crs, dst_crs=dst_crs, indexes=indexes, + buffer=buffer, **kwargs, ) + img.assets = [self.input] - if expression and indexes: - blocks = get_expression_blocks(expression) - bands = [f"b{bidx}" for bidx in indexes] - data = apply_expression(blocks, bands, data) - - if bounds_crs and bounds_crs != dst_crs: - bbox = transform_bounds(bounds_crs, dst_crs, *bbox, densify_pts=21) - - return ImageData( - data, - mask, - bounds=bbox, - crs=dst_crs, - assets=[self.input], - band_names=get_bands_names( - indexes=indexes, expression=expression, count=data.shape[0] - ), - ) + if expression: + return img.apply_expression(expression) + + return img def preview( self, @@ -462,51 +454,21 @@ def preview( max_size (int, optional): Limit the size of the longest dimension of the dataset read, respecting bounds X/Y aspect ratio. Defaults to 1024. height (int, optional): Output height of the array. width (int, optional): Output width of the array. - kwargs (optional): Options to forward to the `rio_tiler.reader.preview` function. + kwargs (optional): Options to forward to the `self.read` method. 
Returns: rio_tiler.models.ImageData: ImageData instance with data, mask and input spatial info. """ - kwargs = {**self._kwargs, **kwargs} - - if isinstance(indexes, int): - indexes = (indexes,) - - if indexes and expression: - warnings.warn( - "Both expression and indexes passed; expression will overwrite indexes parameter.", - ExpressionMixingWarning, - ) - - if expression: - indexes = parse_expression(expression) - - data, mask = reader.preview( - self.dataset, + return self.read( indexes=indexes, + expression=expression, max_size=max_size, - width=width, height=height, + width=width, **kwargs, ) - if expression and indexes: - blocks = get_expression_blocks(expression) - bands = [f"b{bidx}" for bidx in indexes] - data = apply_expression(blocks, bands, data) - - return ImageData( - data, - mask, - bounds=self.bounds, - crs=self.crs, - assets=[self.input], - band_names=get_bands_names( - indexes=indexes, expression=expression, count=data.shape[0] - ), - ) - def point( self, lon: float, @@ -515,7 +477,7 @@ def point( indexes: Optional[Indexes] = None, expression: Optional[str] = None, **kwargs: Any, - ) -> List: + ) -> PointData: """Read a pixel value from a COG. Args: @@ -527,13 +489,10 @@ def point( kwargs (optional): Options to forward to the `rio_tiler.reader.point` function. Returns: - list: Pixel value per band indexes. 
+ PointData """ - kwargs = {**self._kwargs, **kwargs} - - if isinstance(indexes, int): - indexes = (indexes,) + kwargs = {**self.options, **kwargs} if indexes and expression: warnings.warn( @@ -544,16 +503,15 @@ def point( if expression: indexes = parse_expression(expression) - point = reader.point( + pt = reader.point( self.dataset, (lon, lat), indexes=indexes, coord_crs=coord_crs, **kwargs ) + pt.assets = [self.input] - if expression and indexes: - blocks = get_expression_blocks(expression) - bands = [f"b{bidx}" for bidx in indexes] - point = apply_expression(blocks, bands, numpy.array(point)).tolist() + if expression: + return pt.apply_expression(expression) - return point + return pt def feature( self, @@ -565,6 +523,7 @@ def feature( max_size: Optional[int] = None, height: Optional[int] = None, width: Optional[int] = None, + buffer: Optional[NumType] = None, **kwargs: Any, ) -> ImageData: """Read part of a COG defined by a geojson feature. @@ -578,6 +537,7 @@ def feature( max_size (int, optional): Limit the size of the longest dimension of the dataset read, respecting bounds X/Y aspect ratio. height (int, optional): Output height of the array. width (int, optional): Output width of the array. + buffer (int or float, optional): Buffer on each side of the given aoi. It must be a multiple of `0.5`. Output **image size** will be expanded to `output imagesize + 2 * buffer` (e.g 0.5 = 257x257, 1.0 = 258x258). kwargs (optional): Options to forward to the `COGReader.part` method. Returns: @@ -604,6 +564,7 @@ def feature( width=width, height=height, vrt_options=vrt_options, + buffer=buffer, **kwargs, ) @@ -624,10 +585,7 @@ def read( rio_tiler.models.ImageData: ImageData instance with data, mask and input spatial info. 
""" - kwargs = {**self._kwargs, **kwargs} - - if isinstance(indexes, int): - indexes = (indexes,) + kwargs = {**self.options, **kwargs} if indexes and expression: warnings.warn( @@ -638,27 +596,17 @@ def read( if expression: indexes = parse_expression(expression) - data, mask = reader.read(self.dataset, indexes=indexes, **kwargs) - - if expression and indexes: - blocks = get_expression_blocks(expression) - bands = [f"b{bidx}" for bidx in indexes] - data = apply_expression(blocks, bands, data) - - return ImageData( - data, - mask, - bounds=self.bounds, - crs=self.crs, - assets=[self.input], - band_names=get_bands_names( - indexes=indexes, expression=expression, count=data.shape[0] - ), - ) + img = reader.read(self.dataset, indexes=indexes, **kwargs) + img.assets = [self.input] + + if expression: + return img.apply_expression(expression) + + return img @attr.s -class GCPCOGReader(COGReader): +class GCPCOGReader(Reader): """Custom COG Reader with GCPS support. Attributes: @@ -668,21 +616,17 @@ class GCPCOGReader(COGReader): minzoom (int, optional): Overwrite Min Zoom level. maxzoom (int, optional): Overwrite Max Zoom level. colormap (dict, optional): Overwrite internal colormap. - nodata (int or float or str, optional): Global options, overwrite internal nodata value. - unscale (bool, optional): Global options, apply internal scale and offset on all read operations. - resampling_method (rasterio.enums.Resampling, optional): Global options, resampling method to use for read operations. - vrt_options (dict, optional): Global options, WarpedVRT options to use for read operations. - post_process (callable, optional): Global options, Function to apply after all read operations. + options (dict, optional): Options to forward to low-level reader methods. dataset (rasterio.vrtWarpedVRT): Warped VRT constructed with dataset GCPS info. **READ ONLY attribute**. Examples: - >>> with COGReader(src_path) as cog: + >>> with GCPCOGReader(src_path) as cog: cog.tile(...) 
assert cog.dataset assert cog.src_dataset >>> with rasterio.open(src_path) as src_dst: - with COGReader(None, src_dataset=src_dst) as cog: + with GCPCOGReader(None, src_dataset=src_dst) as cog: cog.tile(...) """ @@ -693,29 +637,23 @@ class GCPCOGReader(COGReader): ) tms: TileMatrixSet = attr.ib(default=WEB_MERCATOR_TMS) - minzoom: int = attr.ib(default=None) - maxzoom: int = attr.ib(default=None) - geographic_crs: CRS = attr.ib(default=WGS84_CRS) colormap: Dict = attr.ib(default=None) - # Define global options to be forwarded to functions reading the data (e.g `rio_tiler.reader.read`) - nodata: Optional[NoData] = attr.ib(default=None) - unscale: Optional[bool] = attr.ib(default=None) - resampling_method: Optional[Resampling] = attr.ib(default=None) - vrt_options: Optional[Dict] = attr.ib(default=None) - post_process: Optional[ - Callable[[numpy.ndarray, numpy.ndarray], DataMaskType] - ] = attr.ib(default=None) + options: reader.Options = attr.ib() # for GCPCOGReader, dataset is not a input option. dataset: WarpedVRT = attr.ib(init=False) + @options.default + def _options_default(self): + return {} + def __attrs_post_init__(self): """Define _kwargs, open dataset and get info.""" warnings.warn( - "GCPCOGReader is deprecated and will be removed in 4.0. Please use COGReader.", + "GCPCOGReader is deprecated and will be removed in 4.0. 
Please use Reader.", DeprecationWarning, ) @@ -730,3 +668,277 @@ def __attrs_post_init__(self): ) ) super().__attrs_post_init__() + + +@attr.s +class LocalTileMatrixSet: + """Fake TMS for non-geo image.""" + + width: int = attr.ib() + height: int = attr.ib() + tile_size: int = attr.ib(default=256) + + minzoom: int = attr.ib(init=False, default=0) + maxzoom: int = attr.ib(init=False) + + rasterio_crs: CRS = attr.ib(init=False, default=None) + + @maxzoom.default + def _maxzoom(self): + return get_maximum_overview_level( + self.width, + self.height, + minsize=self.tile_size, + ) + + def _ul(self, *tile: Tile) -> Coords: + """Return the upper left coordinate of the (x, y, z) tile.""" + t = _parse_tile_arg(*tile) + + res = 2.0 ** (self.maxzoom - t.z) + xcoord = self.tile_size * t.x * res + ycoord = self.tile_size * t.y * res + + return Coords(xcoord, ycoord) + + def xy_bounds(self, *tile: Tile) -> BoundingBox: + """Return the bounding box of the (x, y, z) tile""" + t = _parse_tile_arg(*tile) + left, top = self._ul(t) + right, bottom = self._ul(Tile(t.x + 1, t.y + 1, t.z)) + return BoundingBox(left, bottom, right, top) + + +@attr.s +class ImageReader(Reader): + """Non Geo Image Reader""" + + tms: TileMatrixSet = attr.ib(init=False) + + crs: CRS = attr.ib(init=False, default=None) + geographic_crs: CRS = attr.ib(init=False, default=None) + + transform: Affine = attr.ib(init=False) + + def __attrs_post_init__(self): + """Define _kwargs, open dataset and get info.""" + + if not self.dataset: + self.dataset = self._ctx_stack.enter_context(rasterio.open(self.input)) + + height, width = self.dataset.height, self.dataset.width + self.bounds = (0, height, width, 0) + self.transform = transform_from_bounds(*self.bounds, width=width, height=height) + + self.tms = LocalTileMatrixSet(width=width, height=height) + self._minzoom = self.tms.minzoom + self._maxzoom = self.tms.maxzoom + + if self.colormap is None: + self._get_colormap() + + if min( + self.dataset.width, 
self.dataset.height + ) > 512 and not self.dataset.overviews(1): + warnings.warn( + "The dataset has no Overviews. rio-tiler performances might be impacted.", + NoOverviewWarning, + ) + + def tile( # type: ignore + self, + tile_x: int, + tile_y: int, + tile_z: int, + tilesize: int = 256, + indexes: Optional[Indexes] = None, + expression: Optional[str] = None, + force_binary_mask: bool = True, + resampling_method: Resampling = "nearest", + unscale: bool = False, + post_process: Optional[ + Callable[[numpy.ndarray, numpy.ndarray], DataMaskType] + ] = None, + ) -> ImageData: + """Read a Web Map tile from an Image. + + Args: + tile_x (int): Tile's horizontal index. + tile_y (int): Tile's vertical index. + tile_z (int): Tile's zoom level index. + tilesize (int, optional): Output image size. Defaults to `256`. + indexes (int or sequence of int, optional): Band indexes. + expression (str, optional): rio-tiler expression (e.g. b1/b2+b3). + force_binary_mask (bool, optional): Cast returned mask to binary values (0 or 255). Defaults to `True`. + resampling_method (rasterio.enums.Resampling, optional): Rasterio's resampling algorithm. Defaults to `nearest`. + unscale (bool, optional): Apply 'scales' and 'offsets' on output data value. Defaults to `False`. + post_process (callable, optional): Function to apply on output data and mask values. + + Returns: + rio_tiler.models.ImageData: ImageData instance with data, mask and tile spatial info. 
+ + """ + if not self.tile_exists(tile_x, tile_y, tile_z): + raise TileOutsideBounds( + f"Tile {tile_z}/{tile_x}/{tile_y} is outside {self.input} bounds" + ) + + tile_bounds = self.tms.xy_bounds(Tile(x=tile_x, y=tile_y, z=tile_z)) + + return self.part( + tile_bounds, + height=tilesize, + width=tilesize, + max_size=None, + indexes=indexes, + expression=expression, + force_binary_mask=force_binary_mask, + resampling_method=resampling_method, + unscale=unscale, + post_process=post_process, + ) + + def part( # type: ignore + self, + bbox: BBox, + indexes: Optional[Union[int, Sequence]] = None, + expression: Optional[str] = None, + max_size: Optional[int] = None, + height: Optional[int] = None, + width: Optional[int] = None, + force_binary_mask: bool = True, + resampling_method: Resampling = "nearest", + unscale: bool = False, + post_process: Optional[ + Callable[[numpy.ndarray, numpy.ndarray], DataMaskType] + ] = None, + ) -> ImageData: + """Read part of an Image. + + Args: + bbox (tuple): Output bounds (left, bottom, right, top). + indexes (sequence of int or int, optional): Band indexes. + expression (str, optional): rio-tiler expression (e.g. b1/b2+b3). + max_size (int, optional): Limit the size of the longest dimension of the dataset read, respecting bounds X/Y aspect ratio. + height (int, optional): Output height of the array. + width (int, optional): Output width of the array. + force_binary_mask (bool, optional): Cast returned mask to binary values (0 or 255). Defaults to `True`. + resampling_method (rasterio.enums.Resampling, optional): Rasterio's resampling algorithm. Defaults to `nearest`. + unscale (bool, optional): Apply 'scales' and 'offsets' on output data value. Defaults to `False`. + post_process (callable, optional): Function to apply on output data and mask values. + + Returns: + rio_tiler.models.ImageData: ImageData instance with data, mask and input spatial info. 
+ + """ + if indexes and expression: + warnings.warn( + "Both expression and indexes passed; expression will overwrite indexes parameter.", + ExpressionMixingWarning, + ) + + if expression: + indexes = parse_expression(expression) + + window = window_from_bounds(*bbox, transform=self.transform) + img = reader.read( + self.dataset, + window=window, + max_size=max_size, + width=width, + height=height, + indexes=indexes, + force_binary_mask=force_binary_mask, + resampling_method=resampling_method, + unscale=unscale, + post_process=post_process, + ) + img.assets = [self.input] + + if expression: + return img.apply_expression(expression) + + return img + + def point( # type: ignore + self, + x: float, + y: float, + indexes: Optional[Indexes] = None, + expression: Optional[str] = None, + unscale: bool = False, + post_process: Optional[ + Callable[[numpy.ndarray, numpy.ndarray], DataMaskType] + ] = None, + ) -> PointData: + """Read a pixel value from an Image. + + Args: + lon (float): X coordinate. + lat (float): Y coordinate. + indexes (sequence of int or int, optional): Band indexes. + expression (str, optional): rio-tiler expression (e.g. b1/b2+b3). + unscale (bool, optional): Apply 'scales' and 'offsets' on output data value. Defaults to `False`. + post_process (callable, optional): Function to apply on output data and mask values. 
+ + Returns: + PointData + + """ + if not ((0 <= x < self.dataset.width) and (0 <= y < self.dataset.height)): + raise PointOutsideBounds("Point is outside dataset bounds") + + img = self.read( + indexes=indexes, + expression=expression, + unscale=unscale, + post_process=post_process, + window=Window(x, y, 1, 1), + ) + + return PointData( + img.data[:, 0, 0], + numpy.array([img.mask[0, 0]]), + assets=img.assets, + coordinates=self.dataset.xy(x, y), + crs=self.dataset.crs, + band_names=img.band_names, + ) + + def feature( # type: ignore + self, + shape: Dict, + indexes: Optional[Indexes] = None, + expression: Optional[str] = None, + max_size: Optional[int] = None, + height: Optional[int] = None, + width: Optional[int] = None, + force_binary_mask: bool = True, + resampling_method: Resampling = "nearest", + unscale: bool = False, + post_process: Optional[ + Callable[[numpy.ndarray, numpy.ndarray], DataMaskType] + ] = None, + ) -> ImageData: + """Read part of an Image defined by a geojson feature.""" + bbox = featureBounds(shape) + + # If Image Origin is top Left (non-geo) we need to invert the bbox + bbox = [bbox[0], bbox[3], bbox[2], bbox[1]] + + img = self.part( + bbox, + indexes=indexes, + max_size=max_size, + height=height, + width=width, + force_binary_mask=force_binary_mask, + resampling_method=resampling_method, + unscale=unscale, + post_process=post_process, + ) + + shape = shape.get("geometry", shape) + mask = geometry_mask([shape], (img.height, img.width), self.transform) + img.mask = mask * 255 + return img diff --git a/rio_tiler/io/stac.py b/rio_tiler/io/stac.py index d7d32913..058dd611 100644 --- a/rio_tiler/io/stac.py +++ b/rio_tiler/io/stac.py @@ -12,11 +12,11 @@ from morecantile import TileMatrixSet from rasterio.crs import CRS -from ..constants import WEB_MERCATOR_TMS, WGS84_CRS -from ..errors import InvalidAssetName, MissingAssets -from ..utils import aws_get_object -from .base import BaseReader, MultiBaseReader -from .cogeo import COGReader +from 
rio_tiler.constants import WEB_MERCATOR_TMS, WGS84_CRS +from rio_tiler.errors import InvalidAssetName, MissingAssets +from rio_tiler.io.base import BaseReader, MultiBaseReader +from rio_tiler.io.rasterio import Reader +from rio_tiler.utils import aws_get_object DEFAULT_VALID_TYPE = { "image/tiff; application=geotiff", @@ -130,14 +130,15 @@ class STACReader(MultiBaseReader): Attributes: input (str): STAC Item path, URL or S3 URL. item (dict or pystac.Item, STAC): Stac Item. + tms (morecantile.TileMatrixSet, optional): TileMatrixSet grid definition. Defaults to `WebMercatorQuad`. minzoom (int, optional): Set minzoom for the tiles. maxzoom (int, optional): Set maxzoom for the tiles. geographic_crs (rasterio.crs.CRS, optional): CRS to use as geographic coordinate system. Defaults to WGS84. - include (set of string, optional): Only Include specific assets. - exclude (set of string, optional): Exclude specific assets. + include_assets (set of string, optional): Only Include specific assets. + exclude_assets (set of string, optional): Exclude specific assets. include_asset_types (set of string, optional): Only include some assets base on their type. exclude_asset_types (set of string, optional): Exclude some assets base on their type. - reader (rio_tiler.io.BaseReader, optional): rio-tiler Reader. Defaults to `rio_tiler.io.COGReader`. + reader (rio_tiler.io.BaseReader, optional): rio-tiler Reader. Defaults to `rio_tiler.io.Reader`. reader_options (dict, optional): Additional option to forward to the Reader. Defaults to `{}`. fetch_options (dict, optional): Options to pass to `rio_tiler.io.stac.fetch` function fetching the STAC Items. Defaults to `{}`. 
@@ -164,8 +165,8 @@ class STACReader(MultiBaseReader): item: pystac.Item = attr.ib(default=None, converter=_to_pystac_item) tms: TileMatrixSet = attr.ib(default=WEB_MERCATOR_TMS) - minzoom: int = attr.ib(default=None) - maxzoom: int = attr.ib(default=None) + minzoom: int = attr.ib() + maxzoom: int = attr.ib() geographic_crs: CRS = attr.ib(default=WGS84_CRS) @@ -175,7 +176,7 @@ class STACReader(MultiBaseReader): include_asset_types: Set[str] = attr.ib(default=DEFAULT_VALID_TYPE) exclude_asset_types: Optional[Set[str]] = attr.ib(default=None) - reader: Type[BaseReader] = attr.ib(default=COGReader) + reader: Type[BaseReader] = attr.ib(default=Reader) reader_options: Dict = attr.ib(factory=dict) fetch_options: Dict = attr.ib(factory=dict) @@ -202,13 +203,13 @@ def __attrs_post_init__(self): if not self.assets: raise MissingAssets("No valid asset found") - if self.minzoom is None: - # TODO get minzoom from PROJ extension - self.minzoom = self.tms.minzoom + @minzoom.default + def _minzoom(self): + return self.tms.minzoom - if self.maxzoom is None: - # TODO get maxzoom from PROJ extension - self.maxzoom = self.tms.maxzoom + @maxzoom.default + def _maxzoom(self): + return self.tms.maxzoom def _get_asset_url(self, asset: str) -> str: """Validate asset names and return asset's url. 
diff --git a/rio_tiler/io/xarray.py b/rio_tiler/io/xarray.py new file mode 100644 index 00000000..4842b098 --- /dev/null +++ b/rio_tiler/io/xarray.py @@ -0,0 +1,412 @@ +"""rio_tiler.io.xarray: Xarray Reader.""" +from __future__ import annotations + +import warnings +from typing import Any, Dict, List, Optional + +import attr +from morecantile import Tile, TileMatrixSet +from rasterio.crs import CRS +from rasterio.enums import Resampling +from rasterio.features import is_valid_geom +from rasterio.rio.overview import get_maximum_overview_level +from rasterio.transform import from_bounds, rowcol +from rasterio.warp import calculate_default_transform +from rasterio.warp import transform as transform_coords + +from rio_tiler.constants import WEB_MERCATOR_TMS, WGS84_CRS +from rio_tiler.errors import PointOutsideBounds, RioTilerError, TileOutsideBounds +from rio_tiler.io.base import BaseReader +from rio_tiler.models import BandStatistics, ImageData, Info, PointData +from rio_tiler.types import BBox + +try: + import xarray +except ImportError: # pragma: nocover + xarray = None # type: ignore + +try: + import rioxarray +except ImportError: # pragma: nocover + rioxarray = None # type: ignore + + +@attr.s +class XarrayReader(BaseReader): + """Xarray Reader. + + Attributes: + input (xarray.DataArray): Xarray DataArray dataset. + tms (morecantile.TileMatrixSet, optional): TileMatrixSet grid definition. Defaults to `WebMercatorQuad`. + geographic_crs (rasterio.crs.CRS, optional): CRS to use as geographic coordinate system. Defaults to WGS84. + + Examples: + >>> ds = xarray.open_dataset( + "https://pangeo.blob.core.windows.net/pangeo-public/daymet-rio-tiler/na-wgs84.zarr", + engine="zarr", + decode_coords="all", + consolidated=True, + ) + da = ds["tmax"] + + with XarrayReader(da) as dst: + img = dst.tile(...) 
+ + """ + + input: xarray.DataArray = attr.ib() + + tms: TileMatrixSet = attr.ib(default=WEB_MERCATOR_TMS) + geographic_crs: CRS = attr.ib(default=WGS84_CRS) + + _minzoom: int = attr.ib(init=False, default=None) + _maxzoom: int = attr.ib(init=False, default=None) + + _dims: List = attr.ib(init=False, factory=list) + + def __attrs_post_init__(self): + """Set bounds and CRS.""" + assert xarray is not None, "xarray must be installed to use XarrayReader" + assert rioxarray is not None, "rioxarray must be installed to use XarrayReader" + + self.bounds = tuple(self.input.rio.bounds()) + self.crs = self.input.rio.crs + + self._dims = [ + d + for d in self.input.dims + if d not in [self.input.rio.x_dim, self.input.rio.y_dim] + ] + + def _dst_geom_in_tms_crs(self): + """Return dataset info in TMS projection.""" + if self.crs != self.tms.rasterio_crs: + dst_affine, w, h = calculate_default_transform( + self.crs, + self.tms.rasterio_crs, + self.input.rio.width, + self.input.rio.height, + *self.bounds, + ) + else: + dst_affine = list(self.input.rio.transform()) + w = self.input.rio.width + h = self.input.rio.height + + return dst_affine, w, h + + def get_minzoom(self) -> int: + """Define dataset minimum zoom level.""" + if self._minzoom is None: + # We assume the TMS tilesize to be constant over all matrices + # ref: https://github.com/OSGeo/gdal/blob/dc38aa64d779ecc45e3cd15b1817b83216cf96b8/gdal/frmts/gtiff/cogdriver.cpp#L274 + tilesize = self.tms.tileMatrix[0].tileWidth + + try: + dst_affine, w, h = self._dst_geom_in_tms_crs() + + # The minzoom is defined by the resolution of the maximum theoretical overview level + # We assume `tilesize`` is the smallest overview size + overview_level = get_maximum_overview_level(w, h, minsize=tilesize) + + # Get the resolution of the overview + resolution = max(abs(dst_affine[0]), abs(dst_affine[4])) + ovr_resolution = resolution * (2**overview_level) + + # Find what TMS matrix match the overview resolution + self._minzoom = 
self.tms.zoom_for_res(ovr_resolution) + + except Exception: # noqa + # if we can't get the minzoom from the dataset we default to TMS minzoom + warnings.warn( + "Cannot determine minzoom based on dataset information, will default to TMS minzoom.", + UserWarning, + ) + self._minzoom = self.tms.minzoom + + return self._minzoom + + def get_maxzoom(self) -> int: + """Define dataset maximum zoom level.""" + if self._maxzoom is None: + try: + dst_affine, _, _ = self._dst_geom_in_tms_crs() + + # The maxzoom is defined by finding the minimum difference between + # the raster resolution and the zoom level resolution + resolution = max(abs(dst_affine[0]), abs(dst_affine[4])) + self._maxzoom = self.tms.zoom_for_res(resolution) + + except Exception: # noqa + # if we can't get the maxzoom from the dataset we default to TMS maxzoom + warnings.warn( + "Cannot determine maxzoom based on dataset information, will default to TMS maxzoom.", + UserWarning, + ) + self._maxzoom = self.tms.maxzoom + + return self._maxzoom + + @property + def minzoom(self): + """Return dataset minzoom.""" + return self.get_minzoom() + + @property + def maxzoom(self): + """Return dataset maxzoom.""" + return self.get_maxzoom() + + def info(self) -> Info: + """Return xarray.DataArray info.""" + bands = [str(band) for d in self._dims for band in self.input[d].values] + metadata = [band.attrs for d in self._dims for band in self.input[d]] + + meta = { + "bounds": self.geographic_bounds, + "minzoom": self.minzoom, + "maxzoom": self.maxzoom, + "band_metadata": [(f"b{ix}", v) for ix, v in enumerate(metadata, 1)], + "band_descriptions": [(f"b{ix}", v) for ix, v in enumerate(bands, 1)], + "dtype": str(self.input.dtype), + "nodata_type": "Nodata" if self.input.rio.nodata is not None else "None", + "name": self.input.name, + "count": self.input.rio.count, + "width": self.input.rio.width, + "height": self.input.rio.height, + "attrs": self.input.attrs, + } + return Info(**meta) + + def statistics( + self, + categorical: bool = False, + 
categories: Optional[List[float]] = None, + percentiles: List[int] = [2, 98], + hist_options: Optional[Dict] = None, + max_size: int = 1024, + **kwargs: Any, + ) -> Dict[str, BandStatistics]: + """Return bands statistics from a dataset.""" + raise NotImplementedError + + def tile( + self, + tile_x: int, + tile_y: int, + tile_z: int, + tilesize: int = 256, + resampling_method: Resampling = "nearest", + ) -> ImageData: + """Read a Web Map tile from a dataset. + + Args: + tile_x (int): Tile's horizontal index. + tile_y (int): Tile's vertical index. + tile_z (int): Tile's zoom level index. + tilesize (int, optional): Output image size. Defaults to `256`. + resampling_method (rasterio.enums.Resampling, optional): Rasterio's resampling algorithm. Defaults to `nearest`. + + Returns: + rio_tiler.models.ImageData: ImageData instance with data, mask and tile spatial info. + + """ + if not self.tile_exists(tile_x, tile_y, tile_z): + raise TileOutsideBounds( + f"Tile {tile_z}/{tile_x}/{tile_y} is outside bounds" + ) + + tile_bounds = self.tms.xy_bounds(Tile(x=tile_x, y=tile_y, z=tile_z)) + + # Create source array by clipping the xarray dataset to extent of the tile. 
+ ds = self.input.rio.clip_box(*tile_bounds, crs=self.tms.rasterio_crs) + ds = ds.rio.reproject( + self.tms.rasterio_crs, + shape=(tilesize, tilesize), + transform=from_bounds(*tile_bounds, height=tilesize, width=tilesize), + resampling=Resampling[resampling_method], + ) + + # Forward valid_min/valid_max to the ImageData object + minv, maxv = ds.attrs.get("valid_min"), ds.attrs.get("valid_max") + stats = None + if minv is not None and maxv is not None: + stats = ((minv, maxv),) * ds.rio.count + + band_names = [str(band) for d in self._dims for band in self.input[d].values] + + return ImageData( + ds.data, + bounds=tile_bounds, + crs=self.tms.rasterio_crs, + dataset_statistics=stats, + band_names=band_names, + ) + + def part( + self, + bbox: BBox, + dst_crs: Optional[CRS] = None, + bounds_crs: CRS = WGS84_CRS, + resampling_method: Resampling = "nearest", + ) -> ImageData: + """Read part of a dataset. + + Args: + bbox (tuple): Output bounds (left, bottom, right, top) in target crs ("dst_crs"). + dst_crs (rasterio.crs.CRS, optional): Overwrite target coordinate reference system. + bounds_crs (rasterio.crs.CRS, optional): Bounds Coordinate Reference System. Defaults to `epsg:4326`. + resampling_method (rasterio.enums.Resampling, optional): Rasterio's resampling algorithm. Defaults to `nearest`. + + Returns: + rio_tiler.models.ImageData: ImageData instance with data, mask and input spatial info. 
+ + """ + dst_crs = dst_crs or bounds_crs + ds = self.input.rio.clip_box(*bbox, crs=bounds_crs) + + if dst_crs != self.crs: + dst_transform, w, h = calculate_default_transform( + self.crs, + dst_crs, + ds.rio.width, + ds.rio.height, + *ds.rio.bounds(), + ) + ds = ds.rio.reproject( + dst_crs, + shape=(h, w), + transform=dst_transform, + resampling=Resampling[resampling_method], + ) + + # Forward valid_min/valid_max to the ImageData object + minv, maxv = ds.attrs.get("valid_min"), ds.attrs.get("valid_max") + stats = None + if minv is not None and maxv is not None: + stats = ((minv, maxv),) * ds.rio.count + + band_names = [str(band) for d in self._dims for band in self.input[d].values] + + return ImageData( + ds.data, + bounds=ds.rio.bounds(), + crs=ds.rio.crs, + dataset_statistics=stats, + band_names=band_names, + ) + + def preview( + self, + max_size: int = 1024, + height: Optional[int] = None, + width: Optional[int] = None, + ) -> ImageData: + """Return a preview of a dataset. + + Args: + max_size (int, optional): Limit the size of the longest dimension of the dataset read, respecting bounds X/Y aspect ratio. Defaults to 1024. + height (int, optional): Output height of the array. + width (int, optional): Output width of the array. + + Returns: + rio_tiler.models.ImageData: ImageData instance with data, mask and input spatial info. + + """ + raise NotImplementedError + + def point( + self, + lon: float, + lat: float, + coord_crs: CRS = WGS84_CRS, + ) -> PointData: + """Read a pixel value from a dataset. + + Args: + lon (float): Longitude. + lat (float): Latitude. + coord_crs (rasterio.crs.CRS, optional): Coordinate Reference System of the input coords. Defaults to `epsg:4326`. 
+ + Returns: + PointData + + """ + ds_lon, ds_lat = transform_coords(coord_crs, self.crs, [lon], [lat]) + + if not ( + (self.bounds[0] < ds_lon[0] < self.bounds[2]) + and (self.bounds[1] < ds_lat[0] < self.bounds[3]) + ): + raise PointOutsideBounds("Point is outside dataset bounds") + + y, x = rowcol(self.input.rio.transform(), ds_lon, ds_lat) # (rows, cols) + + band_names = [str(band) for d in self._dims for band in self.input[d].values] + + return PointData( + self.input.data[:, y[0], x[0]], + coordinates=(lon, lat), + crs=coord_crs, + band_names=band_names, + ) + + def feature( + self, + shape: Dict, + dst_crs: Optional[CRS] = None, + shape_crs: CRS = WGS84_CRS, + resampling_method: Resampling = "nearest", + ) -> ImageData: + """Read part of a dataset defined by a geojson feature. + + Args: + shape (dict): Valid GeoJSON feature. + dst_crs (rasterio.crs.CRS, optional): Overwrite target coordinate reference system. + shape_crs (rasterio.crs.CRS, optional): Input geojson coordinate reference system. Defaults to `epsg:4326`. + + Returns: + rio_tiler.models.ImageData: ImageData instance with data, mask and input spatial info. 
+ + """ + if not dst_crs: + dst_crs = shape_crs + + if "geometry" in shape: + shape = shape["geometry"] + + if not is_valid_geom(shape): + raise RioTilerError("Invalid geometry") + + ds = self.input.rio.clip([shape], crs=shape_crs) + + if dst_crs != self.crs: + dst_transform, w, h = calculate_default_transform( + self.crs, + dst_crs, + ds.rio.width, + ds.rio.height, + *ds.rio.bounds(), + ) + ds = ds.rio.reproject( + dst_crs, + shape=(h, w), + transform=dst_transform, + resampling=Resampling[resampling_method], + ) + + # Forward valid_min/valid_max to the ImageData object + minv, maxv = ds.attrs.get("valid_min"), ds.attrs.get("valid_max") + stats = None + if minv is not None and maxv is not None: + stats = ((minv, maxv),) * ds.rio.count + + band_names = [str(band) for d in self._dims for band in self.input[d].values] + + return ImageData( + ds.data, + bounds=ds.rio.bounds(), + crs=ds.rio.crs, + dataset_statistics=stats, + band_names=band_names, + ) diff --git a/rio_tiler/models.py b/rio_tiler/models.py index e67dee30..3e20b236 100644 --- a/rio_tiler/models.py +++ b/rio_tiler/models.py @@ -17,9 +17,10 @@ from rio_color.operations import parse_operations from rio_color.utils import scale_dtype, to_math_type -from .errors import InvalidDatatypeWarning -from .types import ColorMapType, GDALColorMapType, IntervalTuple, NumType -from .utils import linear_rescale, render, resize_array +from rio_tiler.errors import InvalidDatatypeWarning +from rio_tiler.expression import apply_expression, get_expression_blocks +from rio_tiler.types import ColorMapType, GDALColorMapType, IntervalTuple, NumType +from rio_tiler.utils import linear_rescale, render, resize_array class NodataTypes(str, Enum): @@ -130,6 +131,119 @@ def rescale_image( return data.astype(out_dtype) +@attr.s +class PointData: + """Point Data class. + + Attributes: + data (numpy.ndarray): pixel values. + mask (numpy.ndarray): rasterio mask values. + band_names (list): name of each band. 
Defaults to `["b1", "b2", "b3"]` for 3 bands image. + coordinates (tuple): Point's coordinates. + crs (rasterio.crs.CRS, optional): Coordinate Reference System of the coordinates. + assets (list, optional): list of assets used to construct the data values. + metadata (dict, optional): Additional metadata. Defaults to `{}`. + + """ + + data: numpy.ndarray = attr.ib() + mask: numpy.ndarray = attr.ib() + band_names: List[str] = attr.ib() + coordinates: Optional[Tuple[float, float]] = attr.ib(default=None) + crs: Optional[CRS] = attr.ib(default=None) + assets: Optional[List] = attr.ib(default=None) + metadata: Optional[Dict] = attr.ib(factory=dict) + + @data.validator + def _validate_data(self, attribute, value): + """PointData data has to be a 1d array.""" + if not len(value.shape) == 1: + raise ValueError("PointsData data has to be a 1D array") + + @coordinates.validator + def _validate_coordinates(self, attribute, value): + """Coordinates have to be a sequence of 2 values.""" + if value and not len(value) == 2: + raise ValueError("Coordinates data has to be a 2d list") + + @band_names.default + def _default_names(self): + return [f"b{ix + 1}" for ix in range(self.count)] + + @mask.default + def _default_mask(self): + return numpy.zeros(self.data.shape[0], dtype="uint8") + 255 + + def __iter__(self): + """Allow for variable expansion.""" + for i in self.data: + yield i + + @property + def count(self) -> int: + """Number of band.""" + return self.data.shape[0] + + @classmethod + def create_from_list(cls, data: Sequence["PointData"]): + """Create PointData from a sequence of PointData objects. + + Args: + data (sequence): sequence of PointData. + + """ + # validate coordinates + if all([pt.coordinates or pt.crs or None for pt in data]): + lon, lat, crs = zip(*[(*(pt.coordinates or []), pt.crs) for pt in data]) + if len(set(lon)) > 1 or len(set(lat)) > 1 or len(set(crs)) > 1: + raise Exception( + "Cannot concatenate points with different coordinates/CRS." 
+ ) + + arr = numpy.concatenate([pt.data for pt in data]) + mask = numpy.concatenate([pt.mask for pt in data]) + + assets = list( + dict.fromkeys( + itertools.chain.from_iterable([pt.assets for pt in data if pt.assets]) + ) + ) + + band_names = list( + itertools.chain.from_iterable( + [pt.band_names for pt in data if pt.band_names] + ) + ) + + return cls( + arr, + mask, + assets=assets, + crs=data[0].crs, + coordinates=data[0].coordinates, + band_names=band_names, + ) + + def as_masked(self) -> numpy.ma.MaskedArray: + """return a numpy masked array.""" + data = numpy.ma.array(self.data) + data.mask = self.mask == 0 + return data + + def apply_expression(self, expression: str) -> "PointData": + """Apply expression to the image data.""" + blocks = get_expression_blocks(expression) + return PointData( + apply_expression(blocks, self.band_names, self.data), + self.mask, + assets=self.assets, + crs=self.crs, + coordinates=self.coordinates, + band_names=blocks, + metadata=self.metadata, + ) + + @attr.s class ImageData: """Image Data class. @@ -142,6 +256,7 @@ class ImageData: crs (rasterio.crs.CRS, optional): Coordinates Reference System of the bounds. metadata (dict, optional): Additional metadata. Defaults to `{}`. band_names (list, optional): name of each band. Defaults to `["1", "2", "3"]` for 3 bands image. 
+ dataset_statistics (list, optional): dataset statistics `[(min, max), (min, max)]` """ @@ -152,6 +267,7 @@ class ImageData: crs: Optional[CRS] = attr.ib(default=None) metadata: Optional[Dict] = attr.ib(factory=dict) band_names: List[str] = attr.ib() + dataset_statistics: Optional[Sequence[Tuple[float, float]]] = attr.ib(default=None) @data.validator def _validate_data(self, attribute, value): @@ -163,7 +279,7 @@ def _validate_data(self, attribute, value): @band_names.default def _default_names(self): - return [f"{ix + 1}" for ix in range(self.count)] + return [f"b{ix + 1}" for ix in range(self.count)] @mask.default def _default_mask(self): @@ -217,8 +333,21 @@ def create_from_list(cls, data: Sequence["ImageData"]): ) ) + stats = list( + itertools.chain.from_iterable( + [img.dataset_statistics for img in data if img.dataset_statistics] + ) + ) + dataset_statistics = stats if len(stats) == len(band_names) else None + return cls( - arr, mask, assets=assets, crs=crs, bounds=bounds, band_names=band_names + arr, + mask, + assets=assets, + crs=crs, + bounds=bounds, + band_names=band_names, + dataset_statistics=dataset_statistics, ) def as_masked(self) -> numpy.ma.MaskedArray: @@ -266,13 +395,46 @@ def rescale( out_dtype: Union[str, numpy.number] = "uint8", ): """Rescale data in place.""" - self.data = rescale_image(self.data, self.mask, in_range, out_range, out_dtype) + self.data = rescale_image( + self.data.copy(), + self.mask, + in_range=in_range, + out_range=out_range, + out_dtype=out_dtype, + ) def apply_color_formula(self, color_formula: Optional[str]): """Apply rio-color formula in place.""" - self.data[self.data < 0] = 0 + out = self.data.copy() + out[out < 0] = 0 + for ops in parse_operations(color_formula): - self.data = scale_dtype(ops(to_math_type(self.data)), numpy.uint8) + out = scale_dtype(ops(to_math_type(out)), numpy.uint8) + + self.data = out + + def apply_expression(self, expression: str) -> "ImageData": + """Apply expression to the image data.""" + 
blocks = get_expression_blocks(expression) + + stats = self.dataset_statistics + if stats: + res = [] + for prod in itertools.product(*stats): # type: ignore + res.append(apply_expression(blocks, self.band_names, numpy.array(prod))) + + stats = list(zip([min(r) for r in zip(*res)], [max(r) for r in zip(*res)])) + + return ImageData( + apply_expression(blocks, self.band_names, self.data), + self.mask.copy(), + assets=self.assets, + crs=self.crs, + bounds=self.bounds, + band_names=blocks, + metadata=self.metadata, + dataset_statistics=stats, + ) def post_process( self, @@ -346,22 +508,23 @@ def render( kwargs.update({"crs": self.crs}) data = self.data.copy() - datatype_range = (dtype_ranges[str(data.dtype)],) + mask = self.mask.copy() + datatype_range = self.dataset_statistics or (dtype_ranges[str(data.dtype)],) if not colormap: if img_format in ["PNG"] and data.dtype not in ["uint8", "uint16"]: warnings.warn( - f"Invalid type: `{data.dtype}` for the `{img_format}` driver. Data will be rescaled using min/max type bounds.", + f"Invalid type: `{data.dtype}` for the `{img_format}` driver. Data will be rescaled using min/max type bounds or dataset_statistics.", InvalidDatatypeWarning, ) - data = rescale_image(data, self.mask, in_range=datatype_range) + data = rescale_image(data, mask, in_range=datatype_range) elif img_format in ["JPEG", "WEBP"] and data.dtype not in ["uint8"]: warnings.warn( - f"Invalid type: `{data.dtype}` for the `{img_format}` driver. Data will be rescaled using min/max type bounds.", + f"Invalid type: `{data.dtype}` for the `{img_format}` driver. 
Data will be rescaled using min/max type bounds or dataset_statistics.", InvalidDatatypeWarning, ) - data = rescale_image(data, self.mask, in_range=datatype_range) + data = rescale_image(data, mask, in_range=datatype_range) elif img_format in ["JP2OPENJPEG"] and data.dtype not in [ "uint8", @@ -369,14 +532,14 @@ def render( "uint16", ]: warnings.warn( - f"Invalid type: `{data.dtype}` for the `{img_format}` driver. Data will be rescaled using min/max type bounds.", + f"Invalid type: `{data.dtype}` for the `{img_format}` driver. Data will be rescaled using min/max type bounds or dataset_statistics.", InvalidDatatypeWarning, ) - data = rescale_image(data, self.mask, in_range=datatype_range) + data = rescale_image(data, mask, in_range=datatype_range) if add_mask: return render( - data, self.mask, img_format=img_format, colormap=colormap, **kwargs + data, mask, img_format=img_format, colormap=colormap, **kwargs ) return render(data, img_format=img_format, colormap=colormap, **kwargs) diff --git a/rio_tiler/mosaic/methods/defaults.py b/rio_tiler/mosaic/methods/defaults.py index ac460ebb..a1728cb1 100644 --- a/rio_tiler/mosaic/methods/defaults.py +++ b/rio_tiler/mosaic/methods/defaults.py @@ -2,7 +2,7 @@ import numpy -from .base import MosaicMethodBase +from rio_tiler.mosaic.methods.base import MosaicMethodBase class FirstMethod(MosaicMethodBase): diff --git a/rio_tiler/mosaic/reader.py b/rio_tiler/mosaic/reader.py index 3b94f2ae..a8e2abbf 100644 --- a/rio_tiler/mosaic/reader.py +++ b/rio_tiler/mosaic/reader.py @@ -5,14 +5,14 @@ from rasterio.crs import CRS -from ..constants import MAX_THREADS -from ..errors import EmptyMosaicError, InvalidMosaicMethod, TileOutsideBounds -from ..models import ImageData -from ..tasks import create_tasks, filter_tasks -from ..types import BBox -from ..utils import _chunks -from .methods.base import MosaicMethodBase -from .methods.defaults import FirstMethod +from rio_tiler.constants import MAX_THREADS +from rio_tiler.errors import 
EmptyMosaicError, InvalidMosaicMethod, TileOutsideBounds +from rio_tiler.models import ImageData +from rio_tiler.mosaic.methods.base import MosaicMethodBase +from rio_tiler.mosaic.methods.defaults import FirstMethod +from rio_tiler.tasks import create_tasks, filter_tasks +from rio_tiler.types import BBox +from rio_tiler.utils import _chunks def mosaic_reader( diff --git a/rio_tiler/reader.py b/rio_tiler/reader.py index b75fc8bc..301fe310 100644 --- a/rio_tiler/reader.py +++ b/rio_tiler/reader.py @@ -1,8 +1,9 @@ """rio-tiler.reader: low level reader.""" +import contextlib import math import warnings -from typing import Any, Callable, Dict, List, Optional, Tuple, Union +from typing import Callable, Dict, Optional, Tuple, TypedDict, Union import numpy from affine import Affine @@ -14,147 +15,291 @@ from rasterio.warp import transform as transform_coords from rasterio.warp import transform_bounds -from .constants import WGS84_CRS -from .errors import AlphaBandWarning, PointOutsideBounds, TileOutsideBounds -from .types import BBox, DataMaskType, Indexes, NoData -from .utils import _requested_tile_aligned_with_internal_tile as is_aligned -from .utils import get_vrt_transform, has_alpha_band, non_alpha_indexes +from rio_tiler.constants import WGS84_CRS +from rio_tiler.errors import InvalidBufferSize, PointOutsideBounds, TileOutsideBounds +from rio_tiler.models import ImageData, PointData +from rio_tiler.types import BBox, DataMaskType, Indexes, NoData +from rio_tiler.utils import _requested_tile_aligned_with_internal_tile as is_aligned +from rio_tiler.utils import get_vrt_transform, has_alpha_band, non_alpha_indexes + + +class Options(TypedDict, total=False): + """Reader Options.""" + + nodata: Optional[NoData] + vrt_options: Optional[Dict] + resampling_method: Optional[Resampling] + unscale: Optional[bool] + post_process: Optional[Callable[[numpy.ndarray, numpy.ndarray], DataMaskType]] + + +def _get_width_height(max_size, dataset_height, dataset_width) -> Tuple[int, 
int]: + """Get Output Width/Height based on a max_size and dataset shape.""" + if max(dataset_height, dataset_width) < max_size: + return dataset_height, dataset_width + + ratio = dataset_height / dataset_width + if ratio > 1: + height = max_size + width = math.ceil(height / ratio) + else: + width = max_size + height = math.ceil(width * ratio) + + return height, width + + +def _apply_buffer( + buffer: float, + bounds: BBox, + height: int, + width: int, +) -> Tuple[BBox, int, int]: + """Apply buffer on bounds.""" + x_res = (bounds[2] - bounds[0]) / width + y_res = (bounds[3] - bounds[1]) / height + + # apply buffer to bounds + bounds = ( + bounds[0] - x_res * buffer, + bounds[1] - y_res * buffer, + bounds[2] + x_res * buffer, + bounds[3] + y_res * buffer, + ) + + # new output size + height += int(buffer * 2) + width += int(buffer * 2) + + return bounds, height, width def read( src_dst: Union[DatasetReader, DatasetWriter, WarpedVRT], + dst_crs: Optional[CRS] = None, height: Optional[int] = None, width: Optional[int] = None, + max_size: Optional[int] = None, indexes: Optional[Indexes] = None, window: Optional[windows.Window] = None, force_binary_mask: bool = True, nodata: Optional[NoData] = None, - unscale: bool = False, - resampling_method: Resampling = "nearest", vrt_options: Optional[Dict] = None, + resampling_method: Resampling = "nearest", + unscale: bool = False, post_process: Optional[ Callable[[numpy.ndarray, numpy.ndarray], DataMaskType] ] = None, -) -> DataMaskType: +) -> ImageData: """Low level read function. Args: src_dst (rasterio.io.DatasetReader or rasterio.io.DatasetWriter or rasterio.vrt.WarpedVRT): Rasterio dataset. - height (int, optional): Output height of the array. - width (int, optional): Output width of the array. + dst_crs (rasterio.crs.CRS, optional): Target coordinate reference system. + height (int, optional): Output height of the image. + width (int, optional): Output width of the image. 
+ max_size (int, optional): Limit output size image if not width and height. indexes (sequence of int or int, optional): Band indexes. window (rasterio.windows.Window, optional): Window to read. - force_binary_mask (bool, optional): Cast returned mask to binary values (0 or 255). Defaults to `True`. nodata (int or float, optional): Overwrite dataset internal nodata value. - unscale (bool, optional): Apply 'scales' and 'offsets' on output data value. Defaults to `False`. - resampling_method (rasterio.enums.Resampling, optional): Rasterio's resampling algorithm. Defaults to `nearest`. vrt_options (dict, optional): Options to be passed to the rasterio.warp.WarpedVRT class. + resampling_method (rasterio.enums.Resampling, optional): Rasterio's resampling algorithm. Defaults to `nearest`. + force_binary_mask (bool, optional): Cast returned mask to binary values (0 or 255). Defaults to `True`. + unscale (bool, optional): Apply 'scales' and 'offsets' on output data value. Defaults to `False`. post_process (callable, optional): Function to apply on output data and mask values. Returns: - tuple: Data (numpy.ndarray) and Mask (numpy.ndarray) values. 
+ ImageData """ if isinstance(indexes, int): indexes = (indexes,) - if indexes is None: - indexes = non_alpha_indexes(src_dst) - if indexes != src_dst.indexes: - warnings.warn( - "Alpha band was removed from the output data array", AlphaBandWarning - ) + if max_size and width and height: + warnings.warn( + "'max_size' will be ignored with 'height' and 'width' set.", + UserWarning, + ) - vrt_params = dict(add_alpha=True, resampling=Resampling[resampling_method]) - nodata = nodata if nodata is not None else src_dst.nodata - if nodata is not None: - vrt_params.update(dict(nodata=nodata, add_alpha=False, src_nodata=nodata)) + resampling = Resampling[resampling_method] + dst_crs = dst_crs or src_dst.crs + with contextlib.ExitStack() as ctx: + # Use WarpedVRT when Re-projection or Nodata or User VRT Option (cutline) + if (dst_crs != src_dst.crs) or nodata is not None or vrt_options: + vrt_params = { + "crs": dst_crs, + "add_alpha": True, + "resampling": resampling, + } - if has_alpha_band(src_dst): - vrt_params.update(dict(add_alpha=False)) + nodata = nodata if nodata is not None else src_dst.nodata + if nodata is not None: + vrt_params.update( + {"nodata": nodata, "add_alpha": False, "src_nodata": nodata} + ) - if vrt_options: - vrt_params.update(vrt_options) + if has_alpha_band(src_dst): + vrt_params.update({"add_alpha": False}) - with WarpedVRT(src_dst, **vrt_params) as vrt: - if ColorInterp.alpha in vrt.colorinterp: - indexes = tuple(indexes) + (vrt.colorinterp.index(ColorInterp.alpha) + 1,) - data = vrt.read( - indexes=indexes, + if vrt_options: + vrt_params.update(**vrt_options) + + # TODO: Check if we fetch the Overviews when not using transform + dataset = ctx.enter_context(WarpedVRT(src_dst, **vrt_params)) + + else: + dataset = src_dst + + if max_size and not (width and height): + height, width = _get_width_height(max_size, dataset.height, dataset.width) + + if indexes is None: + indexes = non_alpha_indexes(dataset) + + boundless = False + if window: + if 
isinstance(window, tuple): + window = windows.Window.from_slices( + *window, height=dataset.height, width=dataset.width, boundless=True + ) + + (row_start, row_stop), (col_start, col_stop) = window.toranges() + if ( + min(col_start, row_start) < 0 + or row_stop > dataset.height # range stops are exclusive + or col_stop > dataset.width + ): + boundless = True + + if ColorInterp.alpha in dataset.colorinterp: + # If dataset has an alpha band we need to get the mask using the alpha band index + # and then split the data and mask values + alpha_idx = dataset.colorinterp.index(ColorInterp.alpha) + 1 + idx = tuple(indexes) + (alpha_idx,) + data = dataset.read( + indexes=idx, window=window, - out_shape=(len(indexes), height, width) if height and width else None, - resampling=Resampling[resampling_method], + out_shape=(len(idx), height, width) if height and width else None, + resampling=resampling, + boundless=boundless, ) data, mask = data[0:-1], data[-1].astype("uint8") else: - data = vrt.read( + data = dataset.read( indexes=indexes, window=window, out_shape=(len(indexes), height, width) if height and width else None, - resampling=Resampling[resampling_method], + resampling=resampling, + boundless=boundless, ) - mask = vrt.dataset_mask( + mask = dataset.dataset_mask( window=window, out_shape=(height, width) if height and width else None, - resampling=Resampling[resampling_method], + resampling=resampling, + boundless=boundless, ) - if force_binary_mask: - mask = numpy.where(mask != 0, numpy.uint8(255), numpy.uint8(0)) + stats = [] + for ix in indexes: + tags = dataset.tags(ix) + if all( + stat in tags for stat in ["STATISTICS_MINIMUM", "STATISTICS_MAXIMUM"] + ): + stat_min = float(tags.get("STATISTICS_MINIMUM")) + stat_max = float(tags.get("STATISTICS_MAXIMUM")) + stats.append((stat_min, stat_max)) + + # We only add dataset statistics if we have them for all the indexes + dataset_statistics = stats if len(stats) == len(indexes) else None - if unscale: - data = data.astype("float32", 
casting="unsafe") - numpy.multiply(data, src_dst.scales[0], out=data, casting="unsafe") - numpy.add(data, src_dst.offsets[0], out=data, casting="unsafe") + if force_binary_mask: + mask = numpy.where(mask != 0, numpy.uint8(255), numpy.uint8(0)) - if post_process: - data, mask = post_process(data, mask) + if unscale: + data = data.astype("float32", casting="unsafe") + numpy.multiply(data, dataset.scales[0], out=data, casting="unsafe") + numpy.add(data, dataset.offsets[0], out=data, casting="unsafe") - return data, mask + if post_process: + data, mask = post_process(data, mask) + out_bounds = ( + windows.bounds(window, dataset.transform) if window else dataset.bounds + ) + + img = ImageData( + data, + mask, + bounds=out_bounds, + crs=dataset.crs, + band_names=[f"b{idx}" for idx in indexes], + dataset_statistics=dataset_statistics, + ) + return img + + +# flake8: noqa: C901 def part( src_dst: Union[DatasetReader, DatasetWriter, WarpedVRT], bounds: BBox, height: Optional[int] = None, width: Optional[int] = None, - padding: int = 0, + max_size: Optional[int] = None, dst_crs: Optional[CRS] = None, bounds_crs: Optional[CRS] = None, + indexes: Optional[Indexes] = None, minimum_overlap: Optional[float] = None, + padding: Optional[int] = None, + buffer: Optional[float] = None, + force_binary_mask: bool = True, + nodata: Optional[NoData] = None, vrt_options: Optional[Dict] = None, - max_size: Optional[int] = None, - **kwargs: Any, -) -> DataMaskType: + resampling_method: Resampling = "nearest", + unscale: bool = False, + post_process: Optional[ + Callable[[numpy.ndarray, numpy.ndarray], DataMaskType] + ] = None, +) -> ImageData: """Read part of a dataset. Args: src_dst (rasterio.io.DatasetReader or rasterio.io.DatasetWriter or rasterio.vrt.WarpedVRT): Rasterio dataset. bounds (tuple): Output bounds (left, bottom, right, top). By default the coordinates are considered to be in either the dataset CRS or in the `dst_crs` if set. Use `bounds_crs` to set a specific CRS. 
- height (int, optional): Output height of the array. - width (int, optional): Output width of the array. - padding (int, optional): Padding to apply to each edge of the tile when retrieving data to assist in reducing resampling artefacts along edges. Defaults to `0`. + height (int, optional): Output height of the image. + width (int, optional): Output width of the image. + max_size (int, optional): Limit output size image if not width and height. dst_crs (rasterio.crs.CRS, optional): Target coordinate reference system. bounds_crs (rasterio.crs.CRS, optional): Overwrite bounds Coordinate Reference System. + indexes (sequence of int or int, optional): Band indexes. minimum_overlap (float, optional): Minimum % overlap for which to raise an error with dataset not covering enough of the tile. + padding (int, optional): Padding to apply to each bbox edge. Helps reduce resampling artefacts along edges. Defaults to `0`. + buffer (float, optional): Buffer to apply to each bbox edge. Defaults to `0.`. + nodata (int or float, optional): Overwrite dataset internal nodata value. vrt_options (dict, optional): Options to be passed to the rasterio.warp.WarpedVRT class. - max_size (int, optional): Limit output size array if not width and height. - kwargs (optional): Additional options to forward to `rio_tiler.reader.read`. + resampling_method (rasterio.enums.Resampling, optional): Rasterio's resampling algorithm. Defaults to `nearest`. + force_binary_mask (bool, optional): Cast returned mask to binary values (0 or 255). Defaults to `True`. + unscale (bool, optional): Apply 'scales' and 'offsets' on output data value. Defaults to `False`. + post_process (callable, optional): Function to apply on output data and mask values. Returns: - tuple: Data (numpy.ndarray) and Mask (numpy.ndarray) values. 
+ ImageData """ - if not dst_crs: - dst_crs = src_dst.crs - if max_size and width and height: warnings.warn( "'max_size' will be ignored with with 'height' and 'width' set.", UserWarning, ) + if buffer and buffer % 0.5: + raise InvalidBufferSize( + "`buffer` must be a multiple of `0.5` (e.g: 0.5, 1, 1.5, ...)." + ) + + padding = padding or 0 + dst_crs = dst_crs or src_dst.crs if bounds_crs: bounds = transform_bounds(bounds_crs, dst_crs, *bounds, densify_pts=21) @@ -177,106 +322,126 @@ def part( "Dataset covers less than {:.0f}% of tile".format(cover_ratio * 100) ) - vrt_transform, vrt_width, vrt_height = get_vrt_transform( - src_dst, bounds, height, width, dst_crs=dst_crs - ) + # Use WarpedVRT when Re-projection or Nodata or User VRT Option (cutline) + if (dst_crs != src_dst.crs) or nodata is not None or vrt_options: + window = None + vrt_transform, vrt_width, vrt_height = get_vrt_transform( + src_dst, + bounds, + height=height, + width=width, + dst_crs=dst_crs, + ) - window = windows.Window(col_off=0, row_off=0, width=vrt_width, height=vrt_height) + if max_size and not (width and height): + height, width = _get_width_height(max_size, vrt_height, vrt_width) - if max_size and not (width and height): - if max(vrt_width, vrt_height) > max_size: - ratio = vrt_height / vrt_width - if ratio > 1: - height = max_size - width = math.ceil(height / ratio) - else: - width = max_size - height = math.ceil(width * ratio) - - out_height = height or vrt_height - out_width = width or vrt_width - if padding > 0 and not is_aligned(src_dst, bounds, out_height, out_width, dst_crs): - vrt_transform = vrt_transform * Affine.translation(-padding, -padding) - orig_vrt_height = vrt_height - orig_vrt_width = vrt_width - vrt_height = vrt_height + 2 * padding - vrt_width = vrt_width + 2 * padding - window = windows.Window( - col_off=padding, - row_off=padding, - width=orig_vrt_width, - height=orig_vrt_height, - ) + height = height or vrt_height + width = width or vrt_width + + if buffer: + 
bounds, height, width = _apply_buffer(buffer, bounds, height, width) + # re-calculate the transform given the new bounds, height and width + vrt_transform, vrt_width, vrt_height = get_vrt_transform( + src_dst, bounds, height, width, dst_crs=dst_crs + ) - vrt_options = vrt_options or {} - vrt_options.update( - { + if padding > 0 and not is_aligned(src_dst, bounds, bounds_crs=dst_crs): + vrt_transform = vrt_transform * Affine.translation(-padding, -padding) + window = windows.Window( + col_off=padding, row_off=padding, width=vrt_width, height=vrt_height + ) + vrt_height = vrt_height + 2 * padding + vrt_width = vrt_width + 2 * padding + + vrt_params = { "crs": dst_crs, "transform": vrt_transform, "width": vrt_width, "height": vrt_height, } - ) + if vrt_options: + vrt_params.update(**vrt_options) + + return read( + src_dst, + indexes=indexes, + width=width, + height=height, + window=window, + nodata=nodata, + vrt_options=vrt_params, + resampling_method=resampling_method, + force_binary_mask=force_binary_mask, + unscale=unscale, + post_process=post_process, + ) + + # else no re-projection needed + window = windows.from_bounds(*bounds, transform=src_dst.transform) + if max_size and not (width and height): + height, width = _get_width_height( + max_size, round(window.height), round(window.width) + ) + + height = height or round(window.height) + width = width or round(window.width) + + if buffer: + bounds, height, width = _apply_buffer(buffer, bounds, height, width) + window = windows.from_bounds(*bounds, transform=src_dst.transform) + + if padding > 0 and not is_aligned(src_dst, bounds, bounds_crs=dst_crs): + # For Padding we also use the buffer approach for non-VRT dataset + pad_bounds, height, width = _apply_buffer(padding, bounds, height, width) + window = windows.from_bounds(*pad_bounds, transform=src_dst.transform) + + img = read( + src_dst, + indexes=indexes, + width=width, + height=height, + window=window, + resampling_method=resampling_method, + 
force_binary_mask=force_binary_mask, + unscale=unscale, + post_process=post_process, + ) + return ImageData( + data=img.data[:, padding:-padding, padding:-padding], + mask=img.mask[padding:-padding, padding:-padding], + bounds=bounds, + crs=img.crs, + band_names=img.band_names, + dataset_statistics=img.dataset_statistics, + ) return read( src_dst, - out_height, - out_width, + indexes=indexes, + width=width, + height=height, window=window, - vrt_options=vrt_options, - **kwargs, + resampling_method=resampling_method, + force_binary_mask=force_binary_mask, + unscale=unscale, + post_process=post_process, ) -def preview( - src_dst: Union[DatasetReader, DatasetWriter, WarpedVRT], - max_size: int = 1024, - height: int = None, - width: int = None, - **kwargs: Any, -) -> DataMaskType: - """Read decimated version of a dataset. - - Args: - src_dst (rasterio.io.DatasetReader or rasterio.io.DatasetWriter or rasterio.vrt.WarpedVRT): Rasterio dataset. - max_size (int, optional): Limit output size array if not width and height. Defaults to `1024`. - height (int, optional): Output height of the array. - width (int, optional): Output width of the array. - kwargs (optional): Additional options to forward to `rio_tiler.reader.read`. - - Returns: - tuple: Data (numpy.ndarray) and Mask (numpy.ndarray) values. 
- - """ - if not height and not width: - if max(src_dst.height, src_dst.width) < max_size: - height, width = src_dst.height, src_dst.width - else: - ratio = src_dst.height / src_dst.width - if ratio > 1: - height = max_size - width = math.ceil(height / ratio) - else: - width = max_size - height = math.ceil(width * ratio) - - return read(src_dst, height, width, **kwargs) - - def point( src_dst: Union[DatasetReader, DatasetWriter, WarpedVRT], coordinates: Tuple[float, float], indexes: Optional[Indexes] = None, coord_crs: CRS = WGS84_CRS, - masked: bool = True, nodata: Optional[NoData] = None, - unscale: bool = False, - resampling_method: Resampling = "nearest", vrt_options: Optional[Dict] = None, + resampling_method: Resampling = "nearest", + unscale: bool = False, post_process: Optional[ Callable[[numpy.ndarray, numpy.ndarray], DataMaskType] ] = None, -) -> List: +) -> PointData: """Read a pixel value for a point. Args: @@ -284,55 +449,75 @@ def point( coordinates (tuple): Coordinates in form of (X, Y). indexes (sequence of int or int, optional): Band indexes. coord_crs (rasterio.crs.CRS, optional): Coordinate Reference System of the input coords. Defaults to `epsg:4326`. - masked (bool): Mask samples that fall outside the extent of the dataset. Defaults to `True`. nodata (int or float, optional): Overwrite dataset internal nodata value. - unscale (bool, optional): Apply 'scales' and 'offsets' on output data value. Defaults to `False`. - resampling_method (rasterio.enums.Resampling, optional): Rasterio's resampling algorithm. Defaults to `nearest`. vrt_options (dict, optional): Options to be passed to the rasterio.warp.WarpedVRT class. + resampling_method (rasterio.enums.Resampling, optional): Rasterio's resampling algorithm. Defaults to `nearest`. + unscale (bool, optional): Apply 'scales' and 'offsets' on output data value. Defaults to `False`. post_process (callable, optional): Function to apply on output data and mask values. 
Returns: - list: Pixel value per band indexes. + PointData """ if isinstance(indexes, int): indexes = (indexes,) - lon, lat = transform_coords( - coord_crs, src_dst.crs, [coordinates[0]], [coordinates[1]] - ) - if not ( - (src_dst.bounds[0] < lon[0] < src_dst.bounds[2]) - and (src_dst.bounds[1] < lat[0] < src_dst.bounds[3]) - ): - raise PointOutsideBounds("Point is outside dataset bounds") - - indexes = indexes if indexes is not None else src_dst.indexes - - vrt_params = dict(add_alpha=True, resampling=Resampling[resampling_method]) - nodata = nodata if nodata is not None else src_dst.nodata - if nodata is not None: - vrt_params.update(dict(nodata=nodata, add_alpha=False, src_nodata=nodata)) - - if has_alpha_band(src_dst): - vrt_params.update(dict(add_alpha=False)) - - if vrt_options: - vrt_params.update(vrt_options) - - with WarpedVRT(src_dst, **vrt_params) as vrt: - values = list(vrt.sample([(lon[0], lat[0])], indexes=indexes, masked=masked))[0] - point_values = values.data - mask = values.mask * 255 if masked else numpy.zeros(point_values.shape) - - if unscale: - point_values = point_values.astype("float32", casting="unsafe") - numpy.multiply( - point_values, src_dst.scales[0], out=point_values, casting="unsafe" - ) - numpy.add(point_values, src_dst.offsets[0], out=point_values, casting="unsafe") + with contextlib.ExitStack() as ctx: + # Use WarpedVRT when Re-projection or Nodata or User VRT Option (cutline) + if nodata is not None or vrt_options: + vrt_params = { + "add_alpha": True, + "resampling": Resampling[resampling_method], + } + nodata = nodata if nodata is not None else src_dst.nodata + if nodata is not None: + vrt_params.update( + {"nodata": nodata, "add_alpha": False, "src_nodata": nodata} + ) + + if has_alpha_band(src_dst): + vrt_params.update({"add_alpha": False}) - if post_process: - point_values, _ = post_process(point_values, mask) + if vrt_options: + vrt_params.update(**vrt_options) + + dataset = ctx.enter_context(WarpedVRT(src_dst, 
**vrt_params)) + + else: + dataset = src_dst + + lon, lat = transform_coords( + coord_crs, dataset.crs, [coordinates[0]], [coordinates[1]] + ) + if not ( + (dataset.bounds[0] < lon[0] < dataset.bounds[2]) + and (dataset.bounds[1] < lat[0] < dataset.bounds[3]) + ): + raise PointOutsideBounds("Point is outside dataset bounds") + + if indexes is None: + indexes = non_alpha_indexes(dataset) + + values = list(dataset.sample([(lon[0], lat[0])], indexes=indexes, masked=True))[ + 0 + ] + data = values.data + mask = ~values.mask * numpy.uint8(255) + + if unscale: + data = data.astype("float32", casting="unsafe") + numpy.multiply(data, dataset.scales[0], out=data, casting="unsafe") + numpy.add(data, dataset.offsets[0], out=data, casting="unsafe") + + if post_process: + data, _ = post_process(data, mask) + + pts = PointData( + data, + mask, + coordinates=coordinates, + crs=coord_crs, + band_names=[f"b{idx}" for idx in indexes], + ) - return point_values.tolist() + return pts diff --git a/rio_tiler/tasks.py b/rio_tiler/tasks.py index 87530b12..e8484f76 100644 --- a/rio_tiler/tasks.py +++ b/rio_tiler/tasks.py @@ -4,9 +4,9 @@ from functools import partial from typing import Any, Callable, Dict, Generator, Optional, Sequence, Tuple, Union -from .constants import MAX_THREADS -from .logger import logger -from .models import ImageData +from rio_tiler.constants import MAX_THREADS +from rio_tiler.logger import logger +from rio_tiler.models import ImageData, PointData TaskType = Sequence[Tuple[Union[futures.Future, Callable], Any]] @@ -72,6 +72,21 @@ def multi_arrays( ) +def multi_points( + asset_list: Sequence, + reader: Callable[..., PointData], + *args: Any, + threads: int = MAX_THREADS, + allowed_exceptions: Optional[Tuple] = None, + **kwargs: Any, +) -> PointData: + """Merge points returned from tasks.""" + tasks = create_tasks(reader, asset_list, threads, *args, **kwargs) + return PointData.create_from_list( + [data for data, _ in filter_tasks(tasks, 
allowed_exceptions=allowed_exceptions)] + ) + + def multi_values( asset_list: Sequence, reader: Callable, diff --git a/rio_tiler/utils.py b/rio_tiler/utils.py index 0a4ae31b..09700025 100644 --- a/rio_tiler/utils.py +++ b/rio_tiler/utils.py @@ -20,11 +20,11 @@ from rasterio.vrt import WarpedVRT from rasterio.warp import calculate_default_transform, transform_geom -from .colormap import apply_cmap -from .constants import WEB_MERCATOR_CRS -from .errors import RioTilerError -from .expression import get_expression_blocks -from .types import BBox, ColorMapType, IntervalTuple +from rio_tiler.colormap import apply_cmap +from rio_tiler.constants import WEB_MERCATOR_CRS +from rio_tiler.errors import RioTilerError +from rio_tiler.expression import get_expression_blocks +from rio_tiler.types import BBox, ColorMapType, IntervalTuple def _chunks(my_list: Sequence, chuck_size: int) -> Generator[Sequence, None, None]: @@ -67,6 +67,10 @@ def get_bands_names( count: Optional[int] = None, ) -> List[str]: """Define bands names based on expression, indexes or band count.""" + warnings.warn( + "`get_bands_names` is deprecated, and will be removed in rio-tiler 4.0`.", + DeprecationWarning, + ) if expression: return get_expression_blocks(expression) @@ -272,9 +276,7 @@ def get_vrt_transform( # If bounds window is aligned with the dataset internal tile we align the bounds with the pixels. # This is to limit the number of internal block fetched. 
- if _requested_tile_aligned_with_internal_tile( - src_dst, bounds, height, width, dst_crs - ): + if _requested_tile_aligned_with_internal_tile(src_dst, bounds, bounds_crs=dst_crs): # Get Window for the input bounds # e.g Window(col_off=17920.0, row_off=11007.999999999998, width=255.99999999999636, height=256.0000000000018) col_off, row_off, w, h = windows.from_bounds( @@ -374,16 +376,14 @@ def linear_rescale( """ imin, imax = in_range omin, omax = out_range - image = numpy.clip(image, imin, imax) - imin - image = image / numpy.float64(imax - imin) - return image * (omax - omin) + omin + im = numpy.clip(image, imin, imax) - imin + im = im / numpy.float64(imax - imin) + return im * (omax - omin) + omin def _requested_tile_aligned_with_internal_tile( src_dst: Union[DatasetReader, DatasetWriter, WarpedVRT], bounds: BBox, - height: Optional[int] = None, - width: Optional[int] = None, bounds_crs: CRS = WEB_MERCATOR_CRS, ) -> bool: """Check if tile is aligned with internal tiles.""" @@ -461,22 +461,20 @@ def render( elif img_format == "NPY": # If mask is not None we add it as the last band if mask is not None: - mask = numpy.expand_dims(mask, axis=0) - data = numpy.concatenate((data, mask)) + m = numpy.expand_dims(mask, axis=0) + data = numpy.concatenate((data, m)) - bio = BytesIO() - numpy.save(bio, data) - bio.seek(0) - return bio.getvalue() + with BytesIO() as bio: + numpy.save(bio, data) + return bio.getvalue() elif img_format == "NPZ": - bio = BytesIO() - if mask is not None: - numpy.savez_compressed(bio, data=data, mask=mask) - else: - numpy.savez_compressed(bio, data=data) - bio.seek(0) - return bio.getvalue() + with BytesIO() as bio: + if mask is not None: + numpy.savez_compressed(bio, data=data, mask=mask) + else: + numpy.savez_compressed(bio, data=data) + return bio.getvalue() count, height, width = data.shape @@ -659,3 +657,13 @@ def resize_array( indexes=indexes, resampling=Resampling[resampling_method], ) + + +def normalize_bounds(bounds: BBox) -> BBox: + 
"""Return BBox in correct minx, miny, maxx, maxy order.""" + return ( + min(bounds[0], bounds[2]), + min(bounds[1], bounds[3]), + max(bounds[0], bounds[2]), + max(bounds[1], bounds[3]), + ) diff --git a/tests/benchmarks/test_benchmarks.py b/tests/benchmarks/test_benchmarks.py index 1f527a98..bcddfbd9 100644 --- a/tests/benchmarks/test_benchmarks.py +++ b/tests/benchmarks/test_benchmarks.py @@ -5,7 +5,7 @@ import pytest import rasterio -from rio_tiler.io import COGReader +from rio_tiler.io import Reader from . import benchmark_dataset, benchmark_tiles @@ -16,7 +16,7 @@ def read_tile(src_path, tile): """Benchmark rio-tiler.utils._tile_read.""" # We make sure to not store things in cache. with rasterio.Env(GDAL_CACHEMAX=0, NUM_THREADS="all"): - with COGReader(src_path, minzoom=0, maxzoom=24) as cog: + with Reader(src_path) as cog: return cog.tile(*tile) diff --git a/tests/fixtures/blue.tif b/tests/fixtures/blue.tif index ab527cb4..8f699011 100644 Binary files a/tests/fixtures/blue.tif and b/tests/fixtures/blue.tif differ diff --git a/tests/fixtures/cog_rgb.tif b/tests/fixtures/cog_rgb.tif new file mode 100644 index 00000000..8529b1b3 Binary files /dev/null and b/tests/fixtures/cog_rgb.tif differ diff --git a/tests/fixtures/green.tif b/tests/fixtures/green.tif index 002ed054..f7c9e16f 100644 Binary files a/tests/fixtures/green.tif and b/tests/fixtures/green.tif differ diff --git a/tests/fixtures/no_geo.jpg b/tests/fixtures/no_geo.jpg new file mode 100644 index 00000000..be29ec30 Binary files /dev/null and b/tests/fixtures/no_geo.jpg differ diff --git a/tests/fixtures/red.tif b/tests/fixtures/red.tif index 933bbc0b..bc527028 100644 Binary files a/tests/fixtures/red.tif and b/tests/fixtures/red.tif differ diff --git a/tests/fixtures/scene_b1.tif b/tests/fixtures/scene_band1.tif similarity index 100% rename from tests/fixtures/scene_b1.tif rename to tests/fixtures/scene_band1.tif diff --git a/tests/fixtures/scene_b2.tif b/tests/fixtures/scene_band2.tif similarity index 
100% rename from tests/fixtures/scene_b2.tif rename to tests/fixtures/scene_band2.tif diff --git a/tests/test_io_MultiBand.py b/tests/test_io_MultiBand.py index 298c83cb..16a159bc 100644 --- a/tests/test_io_MultiBand.py +++ b/tests/test_io_MultiBand.py @@ -10,7 +10,7 @@ from rio_tiler.constants import WEB_MERCATOR_TMS from rio_tiler.errors import ExpressionMixingWarning, MissingBands -from rio_tiler.io import BaseReader, COGReader, MultiBandReader +from rio_tiler.io import BaseReader, MultiBandReader, Reader from rio_tiler.models import BandStatistics PREFIX = os.path.join(os.path.dirname(__file__), "fixtures") @@ -22,9 +22,20 @@ class BandFileReader(MultiBandReader): input: str = attr.ib() tms: morecantile.TileMatrixSet = attr.ib(default=WEB_MERCATOR_TMS) + + reader: Type[BaseReader] = attr.ib(init=False, default=Reader) reader_options: Dict = attr.ib(factory=dict) - reader: Type[BaseReader] = attr.ib(init=False, default=COGReader) + minzoom: int = attr.ib() + maxzoom: int = attr.ib() + + @minzoom.default + def _minzoom(self): + return self.tms.minzoom + + @maxzoom.default + def _maxzoom(self): + return self.tms.maxzoom def __attrs_post_init__(self): """Parse Sceneid and get grid bounds.""" @@ -48,86 +59,98 @@ def _get_band_url(self, band: str) -> str: def test_MultiBandReader(): """Should work as expected.""" with BandFileReader(PREFIX) as cog: - assert cog.bands == ["b1", "b2"] + assert cog.bands == ["band1", "band2"] assert cog.minzoom is not None assert cog.maxzoom is not None assert cog.bounds assert cog.bounds assert cog.crs - assert sorted(cog.parse_expression("b1/b2")) == ["b1", "b2"] + assert sorted(cog.parse_expression("band1/band2")) == ["band1", "band2"] with pytest.warns(UserWarning): meta = cog.info() - assert meta.band_descriptions == [("b1", ""), ("b2", "")] + assert meta.band_descriptions == [("band1", ""), ("band2", "")] - meta = cog.info(bands="b1") - assert meta.band_descriptions == [("b1", "")] + meta = cog.info(bands="band1") + assert 
meta.band_descriptions == [("band1", "")] - meta = cog.info(bands=("b1", "b2")) - assert meta.band_descriptions == [("b1", ""), ("b2", "")] + meta = cog.info(bands=("band1", "band2")) + assert meta.band_descriptions == [("band1", ""), ("band2", "")] with pytest.warns(UserWarning): stats = cog.statistics() - assert stats["b1"] - assert stats["b2"] + assert stats["band1"] + assert stats["band2"] - stats = cog.statistics(bands="b1") - assert "b1" in stats - assert isinstance(stats["b1"], BandStatistics) + stats = cog.statistics(bands="band1") + assert "band1" in stats + assert isinstance(stats["band1"], BandStatistics) - stats = cog.statistics(bands=("b1", "b2")) - assert stats["b1"] - assert stats["b2"] + stats = cog.statistics(bands=("band1", "band2")) + assert stats["band1"] + assert stats["band2"] - stats = cog.statistics(expression="b1;b1+b2;b1-100") - assert stats["b1"] - assert stats["b1+b2"] - assert stats["b1-100"] + stats = cog.statistics(expression="band1;band1+band2;band1-100") + assert stats["band1"] + assert stats["band1+band2"] + assert stats["band1-100"] with pytest.raises(MissingBands): cog.tile(238, 218, 9) - tile = cog.tile(238, 218, 9, bands="b1") + tile = cog.tile(238, 218, 9, bands="band1") assert tile.data.shape == (1, 256, 256) - assert tile.band_names == ["b1"] + assert tile.band_names == ["band1"] with pytest.warns(ExpressionMixingWarning): - tile = cog.tile(238, 218, 9, bands="b1", expression="b1*2") + tile = cog.tile(238, 218, 9, bands="band1", expression="band1*2") assert tile.data.shape == (1, 256, 256) - assert tile.band_names == ["b1*2"] + assert tile.band_names == ["band1*2"] with pytest.raises(MissingBands): cog.part((-11.5, 24.5, -11.0, 25.0)) - tile = cog.part((-11.5, 24.5, -11.0, 25.0), bands="b1") + tile = cog.part((-11.5, 24.5, -11.0, 25.0), bands="band1") assert tile.data.any() - assert tile.band_names == ["b1"] + assert tile.band_names == ["band1"] with pytest.warns(ExpressionMixingWarning): - tile = cog.part((-11.5, 24.5, 
-11.0, 25.0), bands="b1", expression="b1*2") + tile = cog.part( + (-11.5, 24.5, -11.0, 25.0), bands="band1", expression="band1*2" + ) assert tile.data.any() - assert tile.band_names == ["b1*2"] + assert tile.band_names == ["band1*2"] with pytest.raises(MissingBands): cog.preview() - tile = cog.preview(bands="b1") + tile = cog.preview(bands="band1") assert tile.data.any() - assert tile.band_names == ["b1"] + assert tile.band_names == ["band1"] with pytest.warns(ExpressionMixingWarning): - tile = cog.preview(bands="b1", expression="b1*2") + tile = cog.preview(bands="band1", expression="band1*2") assert tile.data.any() - assert tile.band_names == ["b1*2"] + assert tile.band_names == ["band1*2"] with pytest.raises(MissingBands): cog.point(-11.5, 24.5) - assert cog.point(-11.5, 24.5, bands="b1") + pt = cog.point(-11.5, 24.5, bands="band1") + assert len(pt.data) == 1 + assert pt.band_names == ["band1"] + + pt = cog.point(-11.5, 24.5, bands=("band1", "band2")) + assert len(pt.data) == 2 + assert pt.band_names == ["band1", "band2"] + + pt = cog.point(-11.5, 24.5, expression="band1/band2") + assert len(pt.data) == 1 + assert pt.band_names == ["band1/band2"] with pytest.warns(ExpressionMixingWarning): - assert cog.point(-11.5, 24.5, bands="b1", expression="b1*2") + assert cog.point(-11.5, 24.5, bands="band1", expression="band1*2") feat = { "type": "Feature", @@ -151,11 +174,11 @@ def test_MultiBandReader(): with pytest.raises(MissingBands): cog.feature(feat) - img = cog.feature(feat, bands="b1") + img = cog.feature(feat, bands="band1") assert img.data.any() assert not img.mask.all() - assert img.band_names == ["b1"] + assert img.band_names == ["band1"] with pytest.warns(ExpressionMixingWarning): - img = cog.feature(feat, bands="b1", expression="b1*2") - assert img.band_names == ["b1*2"] + img = cog.feature(feat, bands="band1", expression="band1*2") + assert img.band_names == ["band1*2"] diff --git a/tests/test_io_async.py b/tests/test_io_async.py deleted file mode 100644 
index 3f982cb5..00000000 --- a/tests/test_io_async.py +++ /dev/null @@ -1,161 +0,0 @@ -"""Test Async BaseClass.""" - -import asyncio -import functools -import os -import typing -from typing import Any, Coroutine, Dict, List, Type - -import attr -import morecantile -import pytest - -from rio_tiler.constants import WEB_MERCATOR_TMS -from rio_tiler.io import AsyncBaseReader, COGReader -from rio_tiler.models import BandStatistics, ImageData, Info -from rio_tiler.types import BBox - -try: - import contextvars # Python 3.7+ only or via contextvars backport. -except ImportError: # pragma: no cover - contextvars = None # type: ignore - -T = typing.TypeVar("T") - -PREFIX = os.path.join(os.path.dirname(__file__), "fixtures") -COGEO = os.path.join(PREFIX, "cog_nodata.tif") - - -async def run_in_threadpool( - func: typing.Callable[..., T], *args: typing.Any, **kwargs: typing.Any -) -> T: - """Mock Sync function for Async call.Any - - Code from https://github.com/encode/starlette/blob/master/starlette/concurrency.py - """ - loop = asyncio.get_event_loop() - if contextvars is not None: # pragma: no cover - # Ensure we run in the same context - child = functools.partial(func, *args, **kwargs) - context = contextvars.copy_context() - func = context.run - args = (child,) - elif kwargs: # pragma: no cover - # loop.run_in_executor doesn't accept 'kwargs', so bind them in here - func = functools.partial(func, **kwargs) - return await loop.run_in_executor(None, func, *args) - - -@attr.s -class AsyncCOGReader(AsyncBaseReader): - - input: Type[COGReader] = attr.ib() - tms: morecantile.TileMatrixSet = attr.ib(default=WEB_MERCATOR_TMS) - - def __attrs_post_init__(self): - """Update dataset info.""" - self.bounds = self.input.bounds - self.crs = self.input.crs - self.minzoom = self.input.minzoom - self.maxzoom = self.input.maxzoom - - async def info(self) -> Coroutine[Any, Any, Info]: - """Return Dataset's info.""" - return await run_in_threadpool(self.input.info) # type: ignore - - async 
def statistics( - self, **kwargs: Any - ) -> Coroutine[Any, Any, Dict[str, BandStatistics]]: - """Return Dataset's statistics.""" - return await run_in_threadpool(self.input.statistics, **kwargs) # type: ignore - - async def tile( - self, tile_x: int, tile_y: int, tile_z: int, **kwargs: Any - ) -> Coroutine[Any, Any, ImageData]: - """Read a Map tile from the Dataset.""" - return await run_in_threadpool( - self.input.tile, tile_x, tile_y, tile_z, **kwargs # type: ignore - ) - - async def part(self, bbox: BBox, **kwargs: Any) -> Coroutine[Any, Any, ImageData]: - """Read a Part of a Dataset.""" - return await run_in_threadpool(self.input.part, bbox, **kwargs) # type: ignore - - async def preview(self, **kwargs: Any) -> Coroutine[Any, Any, ImageData]: - """Return a preview of a Dataset.""" - return await run_in_threadpool(self.input.preview, **kwargs) # type: ignore - - async def point( - self, lon: float, lat: float, **kwargs: Any - ) -> Coroutine[Any, Any, List]: - """Read a value from a Dataset.""" - return await run_in_threadpool(self.input.point, lon, lat, **kwargs) # type: ignore - - async def feature( - self, shape: Dict, **kwargs: Any - ) -> Coroutine[Any, Any, ImageData]: - """Read a Dataset for a GeoJSON feature""" - return await run_in_threadpool(self.input.feature, shape, **kwargs) # type: ignore - - -@pytest.mark.asyncio -async def test_async(): - dataset = COGReader(COGEO) - - async with AsyncCOGReader(dataset) as cog: - info = await cog.info() - assert info == dataset.info() - - assert cog.minzoom == 5 - assert cog.maxzoom == 9 - - stat = await cog.statistics() - assert stat == dataset.statistics() - - data, mask = await cog.tile(43, 24, 7) - assert data.shape == (1, 256, 256) - assert mask.all() - - lon = -56.624124590533825 - lat = 73.52687881825946 - pts = await cog.point(lon, lat) - assert len(pts) == 1 - - bbox = ( - -56.624124590533825, - 73.50183615350426, - -56.530950796449005, - 73.52687881825946, - ) - data, mask = await cog.part(bbox) - assert 
data.shape == (1, 11, 40) - - data, mask = await cog.preview(max_size=128) - assert data.shape == (1, 128, 128) - - feature = { - "type": "Feature", - "properties": {}, - "geometry": { - "type": "Polygon", - "coordinates": [ - [ - [-56.4697265625, 74.17307693616263], - [-57.667236328125, 73.53462847039683], - [-57.59033203125, 73.13451013251789], - [-56.195068359375, 72.94865294642922], - [-54.964599609375, 72.96797135377102], - [-53.887939453125, 73.84623016391944], - [-53.97583007812499, 74.0165183926664], - [-54.73388671875, 74.23289305339864], - [-55.54687499999999, 74.2269213699517], - [-56.129150390625, 74.21497138945001], - [-56.2060546875, 74.21198251594369], - [-56.4697265625, 74.17307693616263], - ] - ], - }, - } - - img = await cog.feature(feature, max_size=1024) - assert img.data.shape == (1, 348, 1024) diff --git a/tests/test_io_image.py b/tests/test_io_image.py new file mode 100644 index 00000000..d9f14c7d --- /dev/null +++ b/tests/test_io_image.py @@ -0,0 +1,163 @@ +import os +import warnings + +import numpy +import pytest +from rasterio.errors import NotGeoreferencedWarning + +from rio_tiler.errors import PointOutsideBounds, TileOutsideBounds +from rio_tiler.io.rasterio import ImageReader + +PREFIX = os.path.join(os.path.dirname(__file__), "fixtures") +NO_GEO = os.path.join(PREFIX, "no_geo.jpg") +GEO = os.path.join(PREFIX, "cog_nonearth.tif") + + +def test_non_geo_image(): + """Test COGReader usage with Non-Geo Images.""" + with pytest.warns() as w: + with ImageReader(NO_GEO) as src: + assert src.minzoom == 0 + assert src.maxzoom == 3 + assert len(w) == 1 + assert issubclass(w[0].category, NotGeoreferencedWarning) + + with warnings.catch_warnings(): + with ImageReader(NO_GEO) as src: + assert list(src.tms.xy_bounds(0, 0, 3)) == [0, 256, 256, 0] + assert list(src.tms.xy_bounds(0, 0, 2)) == [0, 512, 512, 0] + assert list(src.tms.xy_bounds(0, 0, 1)) == [0, 1024, 1024, 0] + assert list(src.tms.xy_bounds(0, 0, 0)) == [0, 2048, 2048, 0] + + img = 
src.tile(0, 0, 3) + assert img.mask.all() + + # Make sure no resampling was done at full resolution + data = src.dataset.read(window=((0, 256), (0, 256))) + numpy.testing.assert_array_equal(data, img.data) + + # Tile at zoom 0 should have masked part + img = src.tile(0, 0, 0) + assert not img.mask.all() + + with pytest.raises(TileOutsideBounds): + max_x_tile = src.dataset.width // 256 + 1 + max_y_tile = src.dataset.height // 256 + 1 + src.tile(max_x_tile, max_y_tile, 3) + + img = src.part((0, 256, 256, 0)) + data = src.dataset.read(window=((0, 256), (0, 256))) + numpy.testing.assert_array_equal(data, img.data) + + img = src.preview() + assert img.width == 1024 + assert img.height == 1024 + + pt = src.point(0, 0) + assert len(pt.mask) == 1 + assert pt.mask[0] == 255 + data = list(src.dataset.sample([(0, 0)]))[0] + numpy.testing.assert_array_equal(pt.data, data) + + pt = src.point(1999, 1999) + data = list(src.dataset.sample([(1999, 1999)]))[0] + numpy.testing.assert_array_equal(pt.data, data) + + with pytest.raises(PointOutsideBounds): + src.point(2000, 2000) + + poly = { + "coordinates": [ + [ + [-100.0, -100.0], + [1000.0, 100.0], + [500.0, 1000.0], + [-50.0, 500.0], + [-100.0, -100.0], + ] + ], + "type": "Polygon", + } + im = src.feature(poly) + assert im.data.shape == (3, 1100, 1100) + + +def test_with_geo_image(): + """Test ImageReader usage with Geo Images.""" + with ImageReader(GEO) as src: + assert src.minzoom == 0 + assert src.maxzoom == 2 + + assert list(src.tms.xy_bounds(0, 0, 2)) == [0, 256, 256, 0] + assert list(src.tms.xy_bounds(0, 0, 1)) == [0, 512, 512, 0] + assert list(src.tms.xy_bounds(0, 0, 0)) == [0, 1024, 1024, 0] + + img = src.tile(10, 12, 4) + assert img.mask.all() + # img should keep the geo information from the dataset + assert img.crs == src.dataset.crs + assert img.bounds != list(src.tms.xy_bounds(10, 12, 4)) + + img = src.tile(0, 0, 3) + assert not img.mask.any() + + # Make sure no resampling was done at full resolution + data = 
src.dataset.read(window=((0, 256), (0, 256))) + numpy.testing.assert_array_equal(data, img.data) + + # Tile at zoom 0 should have masked part + img = src.tile(0, 0, 0) + assert not img.mask.all() + + with pytest.raises(TileOutsideBounds): + max_x_tile = src.dataset.width // 256 + 1 + max_y_tile = src.dataset.height // 256 + 1 + src.tile(max_x_tile, max_y_tile, 2) + + img = src.part((0, 256, 256, 0)) + data = src.dataset.read(window=((0, 256), (0, 256))) + numpy.testing.assert_array_equal(data, img.data) + + img = src.preview() + assert img.width == 921 + assert img.height == 884 + # img should keep the geo information from the dataset + assert img.crs == src.dataset.crs + assert img.bounds != list(src.tms.xy_bounds(10, 12, 4)) + + pt = src.point(0, 0) + # pixel 0,0 is masked + assert len(pt.mask) == 1 + assert pt.mask[0] == 0 + + data = list(src.dataset.sample([(0, 0)]))[0] + numpy.testing.assert_array_equal(pt.data, data) + + pt = src.point(400, 800) + # pixel 400,800 has valid values + assert len(pt.mask) == 1 + assert pt.mask[0] == 255 + + pt = src.point(920, 883) + data = list(src.dataset.sample([(920, 883)]))[0] + numpy.testing.assert_array_equal(pt.data, data) + assert pt.crs == src.dataset.crs + assert pt.coordinates != [920, 883] + + with pytest.raises(PointOutsideBounds): + src.point(2000, 2000) + + poly = { + "coordinates": [ + [ + [-100.0, -100.0], + [1000.0, 100.0], + [500.0, 1000.0], + [-50.0, 500.0], + [-100.0, -100.0], + ] + ], + "type": "Polygon", + } + im = src.feature(poly) + assert im.data.shape == (1, 1100, 1100) diff --git a/tests/test_io_cogeo.py b/tests/test_io_rasterio.py similarity index 73% rename from tests/test_io_cogeo.py rename to tests/test_io_rasterio.py index 8515c101..70a637d5 100644 --- a/tests/test_io_cogeo.py +++ b/tests/test_io_rasterio.py @@ -1,6 +1,7 @@ -"""tests rio_tiler.io.cogeo.COGReader""" +"""tests rio_tiler.io.rasterio.Reader""" import os +import warnings from io import BytesIO from typing import Any, Dict @@ -12,19 
+13,18 @@ from morecantile import TileMatrixSet from pyproj import CRS from rasterio import transform -from rasterio.io import DatasetReader, MemoryFile +from rasterio.io import MemoryFile from rasterio.vrt import WarpedVRT from rasterio.warp import transform_bounds from rio_tiler.constants import WEB_MERCATOR_TMS, WGS84_CRS from rio_tiler.errors import ( - AlphaBandWarning, ExpressionMixingWarning, - IncorrectTileBuffer, + InvalidBufferSize, NoOverviewWarning, TileOutsideBounds, ) -from rio_tiler.io import COGReader, GCPCOGReader +from rio_tiler.io import Reader from rio_tiler.models import BandStatistics PREFIX = os.path.join(os.path.dirname(__file__), "fixtures") @@ -54,42 +54,29 @@ def test_spatial_info_valid(): """Should work as expected (get spatial info)""" - with COGReader(COG_NODATA) as cog: + with Reader(COG_NODATA) as cog: assert not cog.dataset.closed assert cog.bounds assert cog.crs assert cog.minzoom == 5 assert cog.maxzoom == 9 - assert cog.nodata == cog.dataset.nodata assert cog.dataset.closed - cog = COGReader(COG_NODATA) + cog = Reader(COG_NODATA) assert not cog.dataset.closed cog.close() assert cog.dataset.closed - with COGReader(COG_NODATA, minzoom=3) as cog: - assert cog.minzoom == 3 - assert cog.maxzoom == 9 - - with COGReader(COG_NODATA, maxzoom=12) as cog: - assert cog.minzoom == 5 - assert cog.maxzoom == 12 - - with COGReader(COG_NODATA, minzoom=3, maxzoom=12) as cog: - assert cog.minzoom == 3 - assert cog.maxzoom == 12 - def test_bounds_valid(): """Should work as expected (get bounds)""" - with COGReader(COG_NODATA) as cog: + with Reader(COG_NODATA) as cog: assert len(cog.bounds) == 4 def test_info_valid(): """Should work as expected (get file info)""" - with COGReader(COG_SCALE) as cog: + with Reader(COG_SCALE) as cog: meta = cog.info() assert meta["scale"] assert meta.scale @@ -101,19 +88,19 @@ def test_info_valid(): assert meta.overviews assert meta.driver - with COGReader(COG_CMAP) as cog: + with Reader(COG_CMAP) as cog: assert 
cog.colormap meta = cog.info() assert meta["colormap"] assert meta.colormap - with COGReader(COG_NODATA, colormap={1: (0, 0, 0, 0)}) as cog: + with Reader(COG_NODATA, colormap={1: (0, 0, 0, 0)}) as cog: assert cog.colormap meta = cog.info() assert meta.colormap assert meta.nodata_value - with COGReader(COG_TAGS) as cog: + with Reader(COG_TAGS) as cog: meta = cog.info() assert meta.bounds assert meta.minzoom @@ -126,34 +113,34 @@ def test_info_valid(): assert meta.offset assert meta.band_metadata band_meta = meta.band_metadata[0] - assert band_meta[0] == "1" + assert band_meta[0] == "b1" assert "STATISTICS_MAXIMUM" in band_meta[1] - with COGReader(COG_ALPHA) as cog: + with Reader(COG_ALPHA) as cog: meta = cog.info() assert meta.nodata_type == "Alpha" - with COGReader(COG_MASK) as cog: + with Reader(COG_MASK) as cog: meta = cog.info() assert meta.nodata_type == "Mask" - with COGReader(COGEO) as cog: + with Reader(COGEO) as cog: meta = cog.info() assert meta.nodata_type == "None" - with COGReader(COG_NODATA) as cog: + with Reader(COG_NODATA) as cog: meta = cog.info() assert meta.nodata_type == "Nodata" def test_tile_valid_default(): """Should return a 3 bands array and a full valid mask.""" - with COGReader(COG_NODATA) as cog: + with Reader(COG_NODATA) as cog: # Full tile img = cog.tile(43, 24, 7) assert img.data.shape == (1, 256, 256) assert img.mask.all() - assert img.band_names == ["1"] + assert img.band_names == ["b1"] # Validate that Tile and Part gives the same result tile_bounds = WEB_MERCATOR_TMS.xy_bounds(43, 24, 7) @@ -194,12 +181,12 @@ def test_tile_valid_default(): ), ) assert img.data.shape == (2, 256, 256) - assert img.band_names == ["1", "1"] + assert img.band_names == ["b1", "b1"] # We are using a file that is aligned with the grid so no resampling should be involved - with COGReader(COG_WEB) as cog: + with Reader(COG_WEB) as cog: img = cog.tile(147, 182, 9) - img_buffer = cog.tile(147, 182, 9, tile_buffer=10) + img_buffer = cog.tile(147, 182, 9, 
buffer=10) assert img_buffer.width == 276 assert img_buffer.height == 276 assert not img.bounds == img_buffer.bounds @@ -209,31 +196,31 @@ def test_tile_valid_default(): def test_tile_invalid_bounds(): """Should raise an error with invalid tile.""" with pytest.raises(TileOutsideBounds): - with COGReader(COGEO) as cog: + with Reader(COGEO) as cog: cog.tile(38, 24, 7) def test_tile_with_incorrect_float_buffer(): - with pytest.raises(IncorrectTileBuffer): - with COGReader(COGEO) as cog: - cog.tile(43, 24, 7, tile_buffer=0.8) + with pytest.raises(InvalidBufferSize): + with Reader(COGEO) as cog: + cog.tile(43, 24, 7, buffer=0.8) def test_tile_with_int_buffer(): - with COGReader(COGEO) as cog: - data, mask = cog.tile(43, 24, 7, tile_buffer=1) + with Reader(COGEO) as cog: + data, mask = cog.tile(43, 24, 7, buffer=1) assert data.shape == (1, 258, 258) assert mask.all() - with COGReader(COGEO) as cog: - data, mask = cog.tile(43, 24, 7, tile_buffer=0) + with Reader(COGEO) as cog: + data, mask = cog.tile(43, 24, 7, buffer=0) assert data.shape == (1, 256, 256) assert mask.all() def test_tile_with_correct_float_buffer(): - with COGReader(COGEO) as cog: - data, mask = cog.tile(43, 24, 7, tile_buffer=0.5) + with Reader(COGEO) as cog: + data, mask = cog.tile(43, 24, 7, buffer=0.5) assert data.shape == (1, 257, 257) assert mask.all() @@ -242,21 +229,28 @@ def test_point_valid(): """Read point.""" lon = -56.624124590533825 lat = 73.52687881825946 - with COGReader(COG_NODATA) as cog: - pts = cog.point(lon, lat) - assert len(pts) == 1 - - pts = cog.point(lon, lat, expression="b1*2;b1-100") - assert len(pts) == 2 + with Reader(COG_NODATA) as cog: + pt = cog.point(lon, lat) + assert len(pt.data) == 1 + assert len(pt.mask) == 1 + assert pt.band_names == ["b1"] + + pt = cog.point(lon, lat, expression="b1*2;b1-100") + assert len(pt.data) == 2 + assert len(pt.mask) == 1 + assert pt.mask[0] == 255 + assert pt.band_names == ["b1*2", "b1-100"] with pytest.warns(ExpressionMixingWarning): - pts 
= cog.point(lon, lat, indexes=(1, 2, 3), expression="b1*2") - assert len(pts) == 1 + pt = cog.point(lon, lat, indexes=(1, 2, 3), expression="b1*2") + assert len(pt.data) == 1 + assert pt.band_names == ["b1*2"] - pts = cog.point(lon, lat, indexes=1) - assert len(pts) == 1 + pt = cog.point(lon, lat, indexes=1) + assert len(pt.data) == 1 + assert pt.band_names == ["b1"] - pts = cog.point( + pt = cog.point( lon, lat, indexes=( @@ -264,7 +258,13 @@ def test_point_valid(): 1, ), ) - assert len(pts) == 2 + assert len(pt.data) == 2 + assert pt.band_names == ["b1", "b1"] + + pt = cog.point(-59.53, 74.03, indexes=(1, 1, 1)) + assert len(pt.data) == 3 + assert pt.mask[0] == 0 + assert pt.band_names == ["b1", "b1", "b1"] def test_area_valid(): @@ -275,10 +275,10 @@ def test_area_valid(): -56.530950796449005, 73.52687881825946, ) - with COGReader(COG_NODATA) as cog: + with Reader(COG_NODATA) as cog: img = cog.part(bbox) assert img.data.shape == (1, 11, 40) - assert img.band_names == ["1"] + assert img.band_names == ["b1"] data, mask = cog.part(bbox, dst_crs=cog.dataset.crs) assert data.shape == (1, 28, 30) @@ -306,15 +306,15 @@ def test_area_valid(): ), ) assert img.data.shape == (2, 11, 40) - assert img.band_names == ["1", "1"] + assert img.band_names == ["b1", "b1"] def test_preview_valid(): """Read preview.""" - with COGReader(COGEO) as cog: + with Reader(COGEO) as cog: img = cog.preview(max_size=128) assert img.data.shape == (1, 128, 128) - assert img.band_names == ["1"] + assert img.band_names == ["b1"] data, mask = cog.preview() assert data.shape == (1, 1024, 1021) @@ -339,29 +339,29 @@ def test_preview_valid(): ), ) assert img.data.shape == (2, 128, 128) - assert img.band_names == ["1", "1"] + assert img.band_names == ["b1", "b1"] def test_statistics(): """tests statistics method.""" - with COGReader(COGEO) as cog: + with Reader(COGEO) as cog: stats = cog.statistics() assert len(stats) == 1 - assert isinstance(stats["1"], BandStatistics) - assert stats["1"].percentile_2 
- assert stats["1"].percentile_98 + assert isinstance(stats["b1"], BandStatistics) + assert stats["b1"].percentile_2 + assert stats["b1"].percentile_98 - with COGReader(COGEO) as cog: + with Reader(COGEO) as cog: stats = cog.statistics(percentiles=[3]) - assert stats["1"].percentile_3 + assert stats["b1"].percentile_3 - with COGReader(COGEO) as cog: + with Reader(COGEO) as cog: stats = cog.statistics(percentiles=[3]) - assert stats["1"].percentile_3 + assert stats["b1"].percentile_3 - with COGReader(COG_CMAP) as cog: + with Reader(COG_CMAP) as cog: stats = cog.statistics(categorical=True) - assert stats["1"].histogram[1] == [ + assert stats["b1"].histogram[1] == [ 1.0, 3.0, 4.0, @@ -376,56 +376,56 @@ def test_statistics(): ] stats = cog.statistics(categorical=True, categories=[1, 3]) - assert stats["1"].histogram[1] == [ + assert stats["b1"].histogram[1] == [ 1.0, 3.0, ] # make sure kwargs are passed to `preview` - with COGReader(COGEO) as cog: + with Reader(COGEO) as cog: stats = cog.statistics(width=100, height=100, max_size=None) - assert stats["1"].count == 10000.0 + assert stats["b1"].count == 10000.0 # Check results for expression - with COGReader(COGEO) as cog: + with Reader(COGEO) as cog: stats = cog.statistics(expression="b1;b1*2") assert stats["b1"] assert stats["b1*2"] assert stats["b1"].min == stats["b1*2"].min / 2 -def test_COGReader_Options(): +def test_Reader_Options(): """Set options in reader.""" - with COGReader(COGEO, nodata=1) as cog: - assert cog.nodata == 1 + with Reader(COGEO, options={"nodata": 1}) as cog: + assert cog.info().nodata_value == 1 + assert cog.info().nodata_type == "Nodata" - with COGReader(COGEO) as cog: - assert not cog.nodata + with Reader(COGEO) as cog: assert cog.info().nodata_type == "None" - with COGReader(COGEO, nodata=1) as cog: + with Reader(COGEO, options={"nodata": 1}) as cog: _, mask = cog.tile(43, 25, 7) assert not mask.all() # read cog using default Nearest - with COGReader(COGEO, nodata=1) as cog: + with 
Reader(COGEO, options={"nodata": 1}) as cog: data_default, _ = cog.tile(43, 25, 7) # read cog using bilinear - with COGReader(COGEO, nodata=1, resampling_method="bilinear") as cog: + with Reader(COGEO, options={"nodata": 1, "resampling_method": "bilinear"}) as cog: data, _ = cog.tile(43, 25, 7) assert not numpy.array_equal(data_default, data) - with COGReader(COG_SCALE, unscale=True) as cog: + with Reader(COG_SCALE, options={"unscale": True}) as cog: p = cog.point(310000, 4100000, coord_crs=cog.dataset.crs) - assert round(p[0], 3) == 1000.892 + assert round(float(p.data[0]), 3) == 1000.892 # passing unscale in method should overwrite the defaults p = cog.point(310000, 4100000, coord_crs=cog.dataset.crs, unscale=False) - assert p[0] == 8917 + assert p.data[0] == 8917 cutline = "POLYGON ((13 1685, 1010 6, 2650 967, 1630 2655, 13 1685))" - with COGReader(COGEO, vrt_options={"cutline": cutline}) as cog: + with Reader(COGEO, options={"vrt_options": {"cutline": cutline}}) as cog: _, mask = cog.preview() assert not mask.all() @@ -434,7 +434,7 @@ def callback(data, mask): data = data * 2 return data, mask - with COGReader(COGEO, nodata=1, post_process=callback) as cog: + with Reader(COGEO, options={"nodata": 1, "post_process": callback}) as cog: data_init, _ = cog.tile(43, 25, 7, post_process=None) data, mask = cog.tile(43, 25, 7) assert mask.all() @@ -442,70 +442,19 @@ def callback(data, mask): lon = -56.624124590533825 lat = 73.52687881825946 - with COGReader(COG_NODATA, post_process=callback) as cog: - pts = cog.point(lon, lat) + with Reader(COG_NODATA, options={"post_process": callback}) as cog: + pt = cog.point(lon, lat) - with COGReader(COG_NODATA) as cog: - pts_init = cog.point(lon, lat) - assert pts[0] == pts_init[0] * 2 + with Reader(COG_NODATA) as cog: + pt_init = cog.point(lon, lat) + assert pt.data[0] == pt_init.data[0] * 2 def test_cog_with_internal_gcps(): """Make sure file gets re-projected using gcps.""" - with pytest.warns(DeprecationWarning): - with 
GCPCOGReader(COG_GCPS, nodata=0) as cog: - assert cog.bounds - assert cog.nodata == 0 - assert isinstance(cog.src_dataset, DatasetReader) - assert isinstance(cog.dataset, WarpedVRT) - - assert cog.minzoom == 7 - assert cog.maxzoom == 10 - - metadata = cog.info() - assert len(metadata.band_metadata) == 1 - assert metadata.band_descriptions == [("1", "")] - - tile_z = 8 - tile_x = 183 - tile_y = 120 - data, mask = cog.tile(tile_x, tile_y, tile_z) - assert data.shape == (1, 256, 256) - assert mask.shape == (256, 256) - - # https://github.com/rasterio/rasterio/issues/2092 - # assert cog.dataset.closed - assert cog.src_dataset.closed - - with pytest.warns(DeprecationWarning): - with rasterio.open(COG_GCPS) as dst: - with GCPCOGReader(None, src_dataset=dst, nodata=0) as cog: - assert cog.bounds - assert cog.nodata == 0 - assert isinstance(cog.src_dataset, DatasetReader) - assert isinstance(cog.dataset, WarpedVRT) - - assert cog.minzoom == 7 - assert cog.maxzoom == 10 - - metadata = cog.info() - assert len(metadata.band_metadata) == 1 - assert metadata.band_descriptions == [("1", "")] - - tile_z = 8 - tile_x = 183 - tile_y = 120 - data, mask = cog.tile(tile_x, tile_y, tile_z) - assert data.shape == (1, 256, 256) - assert mask.shape == (256, 256) - # https://github.com/rasterio/rasterio/issues/2092 - # assert cog.dataset.closed - assert not cog.src_dataset.closed - assert cog.src_dataset.closed - - with COGReader(COG_GCPS, nodata=0) as cog: + with Reader(COG_GCPS, options={"nodata": 0}) as cog: assert cog.bounds - assert cog.nodata == 0 + assert cog.info().nodata_value == 0 assert isinstance(cog.dataset, WarpedVRT) assert cog.minzoom == 7 @@ -513,7 +462,7 @@ def test_cog_with_internal_gcps(): metadata = cog.info() assert len(metadata.band_metadata) == 1 - assert metadata.band_descriptions == [("1", "")] + assert metadata.band_descriptions == [("b1", "")] tile_z = 8 tile_x = 183 @@ -531,9 +480,9 @@ def test_cog_with_internal_gcps(): src_crs=dst.gcps[1], 
src_transform=transform.from_gcps(dst.gcps[0]), ) as vrt: - with COGReader(None, dataset=vrt, nodata=0) as cog: + with Reader(None, dataset=vrt, options={"nodata": 0}) as cog: assert cog.bounds - assert cog.nodata == 0 + assert cog.info().nodata_value == 0 assert isinstance(cog.dataset, WarpedVRT) assert cog.minzoom == 7 @@ -541,7 +490,7 @@ def test_cog_with_internal_gcps(): metadata = cog.info() assert len(metadata.band_metadata) == 1 - assert metadata.band_descriptions == [("1", "")] + assert metadata.band_descriptions == [("b1", "")] tile_z = 8 tile_x = 183 @@ -566,7 +515,7 @@ def parse_img(content: bytes) -> Dict[Any, Any]: def test_imageData_output(): """Test ImageData output.""" - with COGReader(COG_NODATA) as cog: + with Reader(COG_NODATA) as cog: img = cog.tile(43, 24, 7) assert img.data.shape == (1, 256, 256) assert img.mask.all() @@ -636,9 +585,12 @@ def test_imageData_output(): img = cog.preview(max_size=128) assert img.data.shape == (1, 128, 128) - assert img.bounds == cog.dataset.bounds meta = parse_img(img.render(img_format="GTiff")) assert meta["crs"] == cog.dataset.crs + # Bounds should be the same but VRT might introduce some rounding issue + for x, y in zip(img.bounds, cog.dataset.bounds): + assert round(x, 5) == round(y, 5) + # assert img.bounds == cog.dataset.bounds def test_feature_valid(): @@ -667,10 +619,10 @@ def test_feature_valid(): }, } - with COGReader(COG_NODATA) as cog: + with Reader(COG_NODATA) as cog: img = cog.feature(feature, max_size=1024) assert img.data.shape == (1, 348, 1024) - assert img.band_names == ["1"] + assert img.band_names == ["b1"] img = cog.feature(feature, dst_crs=cog.dataset.crs, max_size=1024) assert img.data.shape == (1, 1024, 869) @@ -701,7 +653,7 @@ def test_feature_valid(): max_size=1024, ) assert img.data.shape == (2, 348, 1024) - assert img.band_names == ["1", "1"] + assert img.band_names == ["b1", "b1"] # feature overlaping on mask area mask_feat = { @@ -748,12 +700,12 @@ def test_feature_valid(): def 
test_tiling_ignores_padding_if_web_friendly_internal_tiles_exist(): """Ignore Padding when COG is aligned.""" - with COGReader(COG_WEB) as cog: + with Reader(COG_WEB) as cog: img = cog.tile(147, 182, 9, padding=0, resampling_method="bilinear") img2 = cog.tile(147, 182, 9, padding=100, resampling_method="bilinear") assert numpy.array_equal(img.data, img2.data) - with COGReader(COGEO) as cog: + with Reader(COGEO) as cog: img = cog.tile(43, 24, 7, padding=0, resampling_method="bilinear") img2 = cog.tile(43, 24, 7, padding=100, resampling_method="bilinear") assert not numpy.array_equal(img.data, img2.data) @@ -762,22 +714,21 @@ def test_tiling_ignores_padding_if_web_friendly_internal_tiles_exist(): def test_tile_read_alpha(): """Read masked area.""" # non-boundless tile covering the alpha masked part - with COGReader(COG_ALPHA) as cog: - with pytest.warns(AlphaBandWarning): - nb = cog.dataset.count - img = cog.tile(876432, 1603670, 22) - assert ( - not nb == img.count - ) # rio-tiler removes the alpha band from the `data` array - assert img.data.shape == (3, 256, 256) - assert not img.mask.all() + with Reader(COG_ALPHA) as cog: + nb = cog.dataset.count + img = cog.tile(876432, 1603670, 22) + assert ( + not nb == img.count + ) # rio-tiler removes the alpha band from the `data` array + assert img.data.shape == (3, 256, 256) + assert not img.mask.all() def test_tile_read_mask(): """Read masked area.""" with rasterio.Env(GDAL_DISABLE_READDIR_ON_OPEN="EMPTY_DIR"): # non-boundless tile covering the masked part - with COGReader(COG_MASK) as cog: + with Reader(COG_MASK) as cog: img = cog.tile(876431, 1603669, 22, tilesize=16) assert img.data.shape == (3, 16, 16) assert img.mask.shape == (16, 16) @@ -793,7 +744,7 @@ def test_tile_read_extmask(): """Read masked area.""" # non-boundless tile covering the masked part with rasterio.Env(GDAL_DISABLE_READDIR_ON_OPEN="TRUE"): - with COGReader(COG_EXTMASK) as cog: + with Reader(COG_EXTMASK) as cog: img = cog.tile(876431, 1603669, 22) 
assert img.data.shape == (3, 256, 256) assert img.mask.shape == (256, 256) @@ -802,7 +753,7 @@ def test_tile_read_extmask(): def test_dateline(): """Read tile from data crossing the antimeridian.""" - with COGReader(COG_DLINE) as cog: + with Reader(COG_DLINE) as cog: img = cog.tile(0, 84, 8, tilesize=64) assert img.data.shape == (1, 64, 64) @@ -812,23 +763,21 @@ def test_dateline(): def test_fullEarth(): """Should read tile for COG spanning the whole earth.""" - with COGReader(COG_EARTH) as cog: + with Reader(COG_EARTH) as cog: img = cog.tile(1, 42, 7, tilesize=64) assert img.data.shape == (1, 64, 64) img = cog.tile(127, 42, 7, tilesize=64) assert img.data.shape == (1, 64, 64) - with COGReader( - COG_EARTH, tms=morecantile.tms.get("EuropeanETRS89_LAEAQuad") - ) as cog: + with Reader(COG_EARTH, tms=morecantile.tms.get("EuropeanETRS89_LAEAQuad")) as cog: img = cog.tile(0, 0, 1, tilesize=64) assert img.data.shape == (1, 64, 64) def test_read(): """Should read the entire dataset.""" - with COGReader(COGEO) as cog: + with Reader(COGEO) as cog: img = cog.read() assert numpy.array_equal(img.data, cog.dataset.read(indexes=(1,))) assert img.width == cog.dataset.width @@ -854,21 +803,24 @@ def test_read(): def test_no_overviews(): """Should warns when no overviews are found.""" with pytest.warns(NoOverviewWarning): - with COGReader(GEOTIFF): + with Reader(GEOTIFF): pass def test_nonearthbody(): - """COGReader should work with non-earth dataset.""" + """Reader should work with non-earth dataset.""" + EUROPA_SPHERE = CRS.from_proj4("+proj=longlat +R=1560800 +no_defs") + with pytest.warns(UserWarning): - with COGReader(COG_EUROPA) as cog: + with Reader(COG_EUROPA) as cog: assert cog.minzoom == 0 assert cog.maxzoom == 24 - with pytest.warns(None) as warnings: - with COGReader(COG_EUROPA) as cog: + # Warns because of zoom level in WebMercator can't be defined + with pytest.warns(UserWarning) as w: + with Reader(COG_EUROPA, geographic_crs=EUROPA_SPHERE) as cog: assert cog.info() - 
assert len(warnings) == 2 + assert len(w) == 2 img = cog.read() assert numpy.array_equal(img.data, cog.dataset.read(indexes=(1,))) @@ -884,29 +836,29 @@ def test_nonearthbody(): lon = (cog.bounds[0] + cog.bounds[2]) / 2 lat = (cog.bounds[1] + cog.bounds[3]) / 2 - assert cog.point(lon, lat, coord_crs=cog.crs)[0] is not None + assert cog.point(lon, lat, coord_crs=cog.crs).data[0] is not None - europa_crs = CRS.from_authority("ESRI", 104915) - tms = TileMatrixSet.custom( - crs=europa_crs, - extent=europa_crs.area_of_use.bounds, - matrix_scale=[2, 1], - ) - with pytest.warns(None) as warnings: - with COGReader(COG_EUROPA, tms=tms) as cog: - assert cog.minzoom == 4 - assert cog.maxzoom == 6 + with pytest.warns(UserWarning): + europa_crs = CRS.from_authority("ESRI", 104915) + tms = TileMatrixSet.custom( + crs=europa_crs, + extent=europa_crs.area_of_use.bounds, + matrix_scale=[2, 1], + ) - # Get Tile covering the UL corner - bounds = transform_bounds(cog.crs, tms.rasterio_crs, *cog.bounds) - t = tms._tile(bounds[0], bounds[1], cog.minzoom) - img = cog.tile(t.x, t.y, t.z) + with Reader(COG_EUROPA, tms=tms, geographic_crs=EUROPA_SPHERE) as cog: + assert cog.info() + assert cog.minzoom == 4 + assert cog.maxzoom == 6 - assert img.height == 256 - assert img.width == 256 - assert img.crs == tms.rasterio_crs + # Get Tile covering the UL corner + bounds = transform_bounds(cog.crs, tms.rasterio_crs, *cog.bounds) + t = tms._tile(bounds[0], bounds[1], cog.minzoom) + img = cog.tile(t.x, t.y, t.z) - assert len(warnings) == 0 + assert img.height == 256 + assert img.width == 256 + assert img.crs == tms.rasterio_crs def test_nonearth_custom(): @@ -930,7 +882,7 @@ def test_nonearth_custom(): ) @attr.s - class MarsReader(COGReader): + class MarsReader(Reader): """Use custom geographic CRS.""" geographic_crs: rasterio.crs.CRS = attr.ib( @@ -938,14 +890,12 @@ class MarsReader(COGReader): default=rasterio.crs.CRS.from_proj4("+proj=longlat +R=3396190 +no_defs"), ) - with pytest.warns(None) as 
warnings: + with warnings.catch_warnings(): with MarsReader(COG_MARS, tms=mars_tms) as cog: assert cog.geographic_bounds[0] > -180 - assert len(warnings) == 0 - - with pytest.warns(None) as warnings: - with COGReader( + with warnings.catch_warnings(): + with Reader( COG_MARS, tms=mars_tms, geographic_crs=rasterio.crs.CRS.from_proj4( @@ -954,4 +904,31 @@ class MarsReader(COGReader): ) as cog: assert cog.geographic_bounds[0] > -180 - assert len(warnings) == 0 + +def test_tms_tilesize_and_zoom(): + """Test the influence of tms tilesize on COG zoom levels.""" + with Reader(COG_NODATA) as cog: + assert cog.minzoom == 5 + assert cog.maxzoom == 9 + + tms_128 = TileMatrixSet.custom( + WEB_MERCATOR_TMS.xy_bbox, + WEB_MERCATOR_TMS.crs, + title="mercator with 64 tilesize", + tile_width=64, + tile_height=64, + ) + with Reader(COG_NODATA, tms=tms_128) as cog: + assert cog.minzoom == 5 + assert cog.maxzoom == 11 + + tms_2048 = TileMatrixSet.custom( + WEB_MERCATOR_TMS.xy_bbox, + WEB_MERCATOR_TMS.crs, + title="mercator with 2048 tilesize", + tile_width=2048, + tile_height=2048, + ) + with Reader(COG_NODATA, tms=tms_2048) as cog: + assert cog.minzoom == 5 + assert cog.maxzoom == 6 diff --git a/tests/test_io_stac.py b/tests/test_io_stac.py index daf93a52..247dfbb7 100644 --- a/tests/test_io_stac.py +++ b/tests/test_io_stac.py @@ -4,6 +4,7 @@ import os from unittest.mock import patch +import numpy import pytest import rasterio @@ -119,7 +120,7 @@ def raise_for_status(self): assert s3_get.call_args[0] == ("somewhereovertherainbow.io", "mystac.json") -@patch("rio_tiler.io.cogeo.rasterio") +@patch("rio_tiler.io.rasterio.rasterio") def test_tile_valid(rio): """Should raise or return tiles.""" rio.open = mock_rasterio_open @@ -138,22 +139,29 @@ def test_tile_valid(rio): img = stac.tile(71, 102, 8, assets="green") assert img.data.shape == (1, 256, 256) assert img.mask.shape == (256, 256) - assert img.band_names == ["green_1"] + assert img.band_names == ["green_b1"] - data, mask = 
stac.tile(71, 102, 8, assets=("green",)) - assert data.shape == (1, 256, 256) - assert mask.shape == (256, 256) + img = stac.tile(71, 102, 8, assets=("green",)) + assert img.data.shape == (1, 256, 256) + assert img.mask.shape == (256, 256) + assert img.band_names == ["green_b1"] + + img = stac.tile(71, 102, 8, assets=("green", "red")) + assert img.data.shape == (2, 256, 256) + assert img.mask.shape == (256, 256) + assert img.band_names == ["green_b1", "red_b1"] - img = stac.tile(71, 102, 8, expression="green/red") + img = stac.tile(71, 102, 8, expression="green_b1/red_b1") assert img.data.shape == (1, 256, 256) assert img.mask.shape == (256, 256) - # Note: Here we loose the information about the band - assert img.band_names == ["green/red"] + assert img.band_names == ["green_b1/red_b1"] with pytest.warns(ExpressionMixingWarning): - img = stac.tile(71, 102, 8, assets=("green", "red"), expression="green/red") + img = stac.tile( + 71, 102, 8, assets=("green", "red"), expression="green_b1/red_b1" + ) assert img.data.shape == (1, 256, 256) - assert img.band_names == ["green/red"] + assert img.band_names == ["green_b1/red_b1"] img = stac.tile( 71, @@ -170,7 +178,7 @@ def test_tile_valid(rio): ) assert img.data.shape == (3, 256, 256) assert img.mask.shape == (256, 256) - assert img.band_names == ["green_1", "green_1", "red_1"] + assert img.band_names == ["green_b1", "green_b1", "red_b1"] # check backward compatibility for `indexes` img = stac.tile( @@ -178,25 +186,29 @@ def test_tile_valid(rio): 102, 8, assets=("green", "red"), - indexes=1, + indexes=(1, 1), ) - assert img.data.shape == (2, 256, 256) + assert img.data.shape == (4, 256, 256) assert img.mask.shape == (256, 256) - assert img.band_names == ["green_1", "red_1"] + assert img.band_names == ["green_b1", "green_b1", "red_b1", "red_b1"] - img = stac.tile( - 71, - 102, - 8, - assets=("green", "red"), - asset_expression={"green": "b1*2;b1", "red": "b1*2"}, - ) + img = stac.tile(71, 102, 8, 
expression="green_b1*2;green_b1;red_b1*2") assert img.data.shape == (3, 256, 256) assert img.mask.shape == (256, 256) assert img.band_names == ["green_b1*2", "green_b1", "red_b1*2"] + # Should raise KeyError because of missing band 2 + with pytest.raises(KeyError): + img = stac.tile( + 71, + 102, + 8, + expression="green_b1/red_b2", + asset_indexes={"green": 1, "red": 1}, + ) + -@patch("rio_tiler.io.cogeo.rasterio") +@patch("rio_tiler.io.rasterio.rasterio") def test_part_valid(rio): """Should raise or return data.""" rio.open = mock_rasterio_open @@ -214,25 +226,25 @@ def test_part_valid(rio): img = stac.part(bbox, assets="green") assert img.data.shape == (1, 73, 83) assert img.mask.shape == (73, 83) - assert img.band_names == ["green_1"] + assert img.band_names == ["green_b1"] - data, mask = stac.part(bbox, assets=("green",)) - assert data.shape == (1, 73, 83) - assert mask.shape == (73, 83) + img = stac.part(bbox, assets=("green",)) + assert img.data.shape == (1, 73, 83) + assert img.mask.shape == (73, 83) - img = stac.part(bbox, expression="green/red") + img = stac.part(bbox, expression="green_b1/red_b1") assert img.data.shape == (1, 73, 83) assert img.mask.shape == (73, 83) - assert img.band_names == ["green/red"] + assert img.band_names == ["green_b1/red_b1"] - data, mask = stac.part(bbox, assets="green", max_size=30) - assert data.shape == (1, 27, 30) - assert mask.shape == (27, 30) + img = stac.part(bbox, assets="green", max_size=30) + assert img.data.shape == (1, 27, 30) + assert img.mask.shape == (27, 30) with pytest.warns(ExpressionMixingWarning): - img = stac.part(bbox, assets=("green", "red"), expression="green/red") + img = stac.part(bbox, assets=("green", "red"), expression="green_b1/red_b1") assert img.data.shape == (1, 73, 83) - assert img.band_names == ["green/red"] + assert img.band_names == ["green_b1/red_b1"] img = stac.part( bbox, @@ -247,24 +259,20 @@ def test_part_valid(rio): ) assert img.data.shape == (3, 73, 83) assert img.mask.shape == 
(73, 83) - assert img.band_names == ["green_1", "green_1", "red_1"] + assert img.band_names == ["green_b1", "green_b1", "red_b1"] img = stac.part(bbox, assets=("green", "red"), indexes=1) assert img.data.shape == (2, 73, 83) assert img.mask.shape == (73, 83) - assert img.band_names == ["green_1", "red_1"] + assert img.band_names == ["green_b1", "red_b1"] - img = stac.part( - bbox, - assets=("green", "red"), - asset_expression={"green": "b1*2;b1", "red": "b1*2"}, - ) + img = stac.part(bbox, expression="green_b1*2;green_b1;red_b1*2") assert img.data.shape == (3, 73, 83) assert img.mask.shape == (73, 83) assert img.band_names == ["green_b1*2", "green_b1", "red_b1*2"] -@patch("rio_tiler.io.cogeo.rasterio") +@patch("rio_tiler.io.rasterio.rasterio") def test_preview_valid(rio): """Should raise or return data.""" rio.open = mock_rasterio_open @@ -280,21 +288,21 @@ def test_preview_valid(rio): img = stac.preview(assets="green") assert img.data.shape == (1, 259, 255) assert img.mask.shape == (259, 255) - assert img.band_names == ["green_1"] + assert img.band_names == ["green_b1"] - data, mask = stac.preview(assets=("green",)) - assert data.shape == (1, 259, 255) - assert mask.shape == (259, 255) + img = stac.preview(assets=("green",)) + assert img.data.shape == (1, 259, 255) + assert img.mask.shape == (259, 255) - img = stac.preview(expression="green/red") + img = stac.preview(expression="green_b1/red_b1") assert img.data.shape == (1, 259, 255) assert img.mask.shape == (259, 255) - assert img.band_names == ["green/red"] + assert img.band_names == ["green_b1/red_b1"] with pytest.warns(ExpressionMixingWarning): - img = stac.preview(assets=("green", "red"), expression="green/red") + img = stac.preview(assets=("green", "red"), expression="green_b1/red_b1") assert img.data.shape == (1, 259, 255) - assert img.band_names == ["green/red"] + assert img.band_names == ["green_b1/red_b1"] img = stac.preview( assets=("green", "red"), @@ -308,23 +316,20 @@ def test_preview_valid(rio): ) 
assert img.data.shape == (3, 259, 255) assert img.mask.shape == (259, 255) - assert img.band_names == ["green_1", "green_1", "red_1"] + assert img.band_names == ["green_b1", "green_b1", "red_b1"] img = stac.preview(assets=("green", "red"), indexes=1) assert img.data.shape == (2, 259, 255) assert img.mask.shape == (259, 255) - assert img.band_names == ["green_1", "red_1"] + assert img.band_names == ["green_b1", "red_b1"] - img = stac.preview( - assets=("green", "red"), - asset_expression={"green": "b1*2;b1", "red": "b1*2"}, - ) + img = stac.preview(expression="green_b1*2;green_b1;red_b1*2") assert img.data.shape == (3, 259, 255) assert img.mask.shape == (259, 255) assert img.band_names == ["green_b1*2", "green_b1", "red_b1*2"] -@patch("rio_tiler.io.cogeo.rasterio") +@patch("rio_tiler.io.rasterio.rasterio") def test_point_valid(rio): """Should raise or return data.""" rio.open = mock_rasterio_open @@ -337,53 +342,52 @@ def test_point_valid(rio): with pytest.raises(MissingAssets): stac.point(-80.477, 33.4453) - data = stac.point(-80.477, 33.4453, assets="green") - assert len(data) == 1 + pt = stac.point(-80.477, 33.4453, assets="green") + assert len(pt.data) == 1 + assert pt.band_names == ["green_b1"] + + pt = stac.point(-80.477, 33.4453, assets=("green",)) + assert len(pt.data) == 1 + assert pt.band_names == ["green_b1"] - data = stac.point(-80.477, 33.4453, assets=("green",)) - assert len(data) == 1 + pt = stac.point(-80.477, 33.4453, assets=("green", "red")) + assert len(pt.data) == 2 + assert numpy.array_equal(pt.data, numpy.array([7994, 7003])) + assert pt.band_names == ["green_b1", "red_b1"] - data = stac.point(-80.477, 33.4453, expression="green/red") - assert len(data) == 1 + pt = stac.point(-80.477, 33.4453, expression="green_b1/red_b1") + assert len(pt.data) == 1 + assert numpy.array_equal(pt.data, numpy.array([7994 / 7003])) + assert pt.band_names == ["green_b1/red_b1"] with pytest.warns(ExpressionMixingWarning): - data = stac.point( - -80.477, 33.4453, 
assets=("green", "red"), expression="green/red" + pt = stac.point( + -80.477, 33.4453, assets=("green", "red"), expression="green_b1/red_b1" ) - assert len(data) == 1 + assert len(pt.data) == 1 + assert pt.band_names == ["green_b1/red_b1"] - data = stac.point( + pt = stac.point( -80.477, 33.4453, assets=("green", "red"), asset_indexes={"green": (1, 1), "red": 1}, ) - assert len(data) == 2 - assert len(data[0]) == 2 - assert len(data[1]) == 1 + assert len(pt.data) == 3 + assert numpy.array_equal(pt.data, numpy.array([7994, 7994, 7003])) + assert pt.band_names == ["green_b1", "green_b1", "red_b1"] - data = stac.point( - -80.477, - 33.4453, - assets=("green", "red"), - indexes=1, - ) - assert len(data) == 2 - assert len(data[0]) == 1 - assert len(data[1]) == 1 + pt = stac.point(-80.477, 33.4453, assets=("green", "red"), indexes=1) + assert len(pt.data) == 2 + assert numpy.array_equal(pt.data, numpy.array([7994, 7003])) + assert pt.band_names == ["green_b1", "red_b1"] - data = stac.point( - -80.477, - 33.4453, - assets=("green", "red"), - asset_expression={"green": "b1*2;b1", "red": "b1*2"}, - ) - assert len(data) == 2 - assert len(data[0]) == 2 - assert len(data[1]) == 1 + pt = stac.point(-80.477, 33.4453, expression="green_b1*2;green_b1;red_b1*2") + assert len(pt.data) == 3 + assert pt.band_names == ["green_b1*2", "green_b1", "red_b1*2"] -@patch("rio_tiler.io.cogeo.rasterio") +@patch("rio_tiler.io.rasterio.rasterio") def test_statistics_valid(rio): """Should raise or return data.""" rio.open = mock_rasterio_open @@ -400,11 +404,11 @@ def test_statistics_valid(rio): stats = stac.statistics(assets="green") assert stats["green"] - assert isinstance(stats["green"]["1"], BandStatistics) + assert isinstance(stats["green"]["b1"], BandStatistics) stats = stac.statistics(assets=("green", "red"), hist_options={"bins": 20}) assert len(stats) == 2 - assert len(stats["green"]["1"]["histogram"][0]) == 20 + assert len(stats["green"]["b1"]["histogram"][0]) == 20 # Check that 
asset_expression is passed stats = stac.statistics( @@ -419,17 +423,17 @@ def test_statistics_valid(rio): assets=("green", "red"), asset_indexes={"green": 1, "red": 1} ) assert stats["green"] - assert isinstance(stats["green"]["1"], BandStatistics) - assert isinstance(stats["red"]["1"], BandStatistics) + assert isinstance(stats["green"]["b1"], BandStatistics) + assert isinstance(stats["red"]["b1"], BandStatistics) # Check that asset_indexes is passed stats = stac.statistics(assets=("green", "red"), indexes=1) assert stats["green"] - assert isinstance(stats["green"]["1"], BandStatistics) - assert isinstance(stats["red"]["1"], BandStatistics) + assert isinstance(stats["green"]["b1"], BandStatistics) + assert isinstance(stats["red"]["b1"], BandStatistics) -@patch("rio_tiler.io.cogeo.rasterio") +@patch("rio_tiler.io.rasterio.rasterio") def test_merged_statistics_valid(rio): """Should raise or return data.""" rio.open = mock_rasterio_open @@ -438,28 +442,25 @@ def test_merged_statistics_valid(rio): with pytest.warns(UserWarning): stats = stac.merged_statistics() assert len(stats) == 3 - assert isinstance(stats["red_1"], BandStatistics) - assert stats["red_1"] - assert stats["green_1"] - assert stats["blue_1"] + assert isinstance(stats["red_b1"], BandStatistics) + assert stats["red_b1"] + assert stats["green_b1"] + assert stats["blue_b1"] with pytest.raises(InvalidAssetName): stac.merged_statistics(assets="vert") stats = stac.merged_statistics(assets="green") - assert isinstance(stats["green_1"], BandStatistics) + assert isinstance(stats["green_b1"], BandStatistics) stats = stac.merged_statistics( assets=("green", "red"), hist_options={"bins": 20} ) assert len(stats) == 2 - assert len(stats["green_1"]["histogram"][0]) == 20 - assert len(stats["red_1"]["histogram"][0]) == 20 + assert len(stats["green_b1"]["histogram"][0]) == 20 + assert len(stats["red_b1"]["histogram"][0]) == 20 - # Check that asset_expression is passed - stats = stac.merged_statistics( - assets=("green", 
"red"), asset_expression={"green": "b1*2", "red": "b1+100"} - ) + stats = stac.merged_statistics(expression="green_b1*2;green_b1;red_b1+100") assert isinstance(stats["green_b1*2"], BandStatistics) assert isinstance(stats["red_b1+100"], BandStatistics) @@ -467,22 +468,11 @@ def test_merged_statistics_valid(rio): stats = stac.merged_statistics( assets=("green", "red"), asset_indexes={"green": 1, "red": 1} ) - assert isinstance(stats["green_1"], BandStatistics) - assert isinstance(stats["red_1"], BandStatistics) - - # Check Expression - stats = stac.merged_statistics(expression="green/red") - assert isinstance(stats["green/red"], BandStatistics) + assert isinstance(stats["green_b1"], BandStatistics) + assert isinstance(stats["red_b1"], BandStatistics) - # Check that we can use expression and asset_expression - stats = stac.merged_statistics( - expression="green/red", - asset_expression={"green": "b1*2", "red": "b1+100"}, - ) - assert isinstance(stats["green/red"], BandStatistics) - -@patch("rio_tiler.io.cogeo.rasterio") +@patch("rio_tiler.io.rasterio.rasterio") def test_info_valid(rio): """Should raise or return data.""" rio.open = mock_rasterio_open @@ -506,16 +496,30 @@ def test_info_valid(rio): def test_parse_expression(): - """.""" + """Parse assets expressions.""" with STACReader(STAC_PATH) as stac: - assert sorted(stac.parse_expression("green*red+red/blue+2.0")) == [ + assert sorted( + stac.parse_expression("green_b1*red_b1+red_b1/blue_b1+2.0;red_b1") + ) == [ "blue", "green", "red", ] + # make sure we match full word only + with STACReader(STAC_PATH) as stac: + assert sorted( + stac.parse_expression("greenish_b1*red_b1+red_b1/blue_b1+2.0;red_b1") + ) == ["blue", "red"] -@patch("rio_tiler.io.cogeo.rasterio") + # make sure we match full word only + with STACReader(STAC_PATH) as stac: + assert sorted( + stac.parse_expression("green_b10foo*red_b1+red_b1/blue_b1+2.0;red_b1") + ) == ["blue", "red"] + + +@patch("rio_tiler.io.rasterio.rasterio") def 
test_feature_valid(rio): """Should raise or return data.""" rio.open = mock_rasterio_open @@ -553,43 +557,41 @@ def test_feature_valid(rio): img = stac.feature(feat, assets="green") assert img.data.shape == (1, 118, 96) assert img.mask.shape == (118, 96) - assert img.band_names == ["green_1"] + assert img.band_names == ["green_b1"] - data, mask = stac.feature(feat, assets=("green",)) - assert data.shape == (1, 118, 96) - assert mask.shape == (118, 96) + img = stac.feature(feat, assets=("green",)) + assert img.data.shape == (1, 118, 96) + assert img.mask.shape == (118, 96) - img = stac.feature(feat, expression="green/red") + img = stac.feature(feat, expression="green_b1/red_b1") assert img.data.shape == (1, 118, 96) assert img.mask.shape == (118, 96) - assert img.band_names == ["green/red"] + assert img.band_names == ["green_b1/red_b1"] - data, mask = stac.feature(feat, assets="green", max_size=30) - assert data.shape == (1, 30, 25) - assert mask.shape == (30, 25) + img = stac.feature(feat, assets="green", max_size=30) + assert img.data.shape == (1, 30, 25) + assert img.mask.shape == (30, 25) with pytest.warns(ExpressionMixingWarning): - img = stac.feature(feat, assets=("green", "red"), expression="green/red") + img = stac.feature( + feat, assets=("green", "red"), expression="green_b1/red_b1" + ) assert img.data.shape == (1, 118, 96) - assert img.band_names == ["green/red"] + assert img.band_names == ["green_b1/red_b1"] img = stac.feature( feat, assets=("green", "red"), asset_indexes={"green": (1, 1), "red": 1} ) assert img.data.shape == (3, 118, 96) assert img.mask.shape == (118, 96) - assert img.band_names == ["green_1", "green_1", "red_1"] + assert img.band_names == ["green_b1", "green_b1", "red_b1"] img = stac.feature(feat, assets=("green", "red"), indexes=1) assert img.data.shape == (2, 118, 96) assert img.mask.shape == (118, 96) - assert img.band_names == ["green_1", "red_1"] + assert img.band_names == ["green_b1", "red_b1"] - img = stac.feature( - feat, - 
assets=("green", "red"), - asset_expression={"green": "b1*2;b1", "red": "b1*2"}, - ) + img = stac.feature(feat, expression="green_b1*2;green_b1;red_b1*2") assert img.data.shape == (3, 118, 96) assert img.mask.shape == (118, 96) assert img.band_names == ["green_b1*2", "green_b1", "red_b1*2"] @@ -662,3 +664,16 @@ def raise_for_status(self): s3_get.assert_called_once() assert s3_get.call_args[1]["request_pays"] assert s3_get.call_args[0] == ("somewhereovertherainbow.io", "mystac.json") + + +@patch("rio_tiler.io.rasterio.rasterio") +def test_img_dataset_stats(rio): + """Make sure dataset statistics are forwarded.""" + rio.open = mock_rasterio_open + + with STACReader(STAC_PATH) as stac: + img = stac.preview(assets=("green", "red")) + assert img.dataset_statistics == [(6883, 62785), (6101, 65035)] + + img = stac.preview(expression="green_b1/red_b1") + assert img.dataset_statistics == [(6883 / 65035, 62785 / 6101)] diff --git a/tests/test_io_xarray.py b/tests/test_io_xarray.py new file mode 100644 index 00000000..c4f1cf1b --- /dev/null +++ b/tests/test_io_xarray.py @@ -0,0 +1,87 @@ +"""tests rio_tiler.io.xarray.XarrayReader""" + +import os +from datetime import datetime + +import numpy +import xarray + +from rio_tiler.io import XarrayReader + +PREFIX = os.path.join(os.path.dirname(__file__), "fixtures") + +planet = os.path.join(PREFIX, "PLANET_SCOPE_3D.nc") + + +def test_xarray_reader(): + """test XarrayReader.""" + arr = numpy.random.randn(1, 33, 35) + data = xarray.DataArray( + arr, + dims=("time", "y", "x"), + coords={ + "x": list(range(-170, 180, 10)), + "y": list(range(-80, 85, 5)), + "time": [datetime(2022, 1, 1)], + }, + ) + data.attrs.update({"valid_min": arr.min(), "valid_max": arr.max()}) + + data.rio.write_crs("epsg:4326", inplace=True) + with XarrayReader(data) as dst: + info = dst.info() + assert info.minzoom == 0 + assert info.maxzoom == 0 + assert info.band_metadata == [("b1", {})] + assert info.band_descriptions == [("b1", 
"2022-01-01T00:00:00.000000000")] + assert info.height == 33 + assert info.width == 35 + assert info.count == 1 + assert info.attrs + + with XarrayReader(data) as dst: + img = dst.tile(0, 0, 0) + assert img.count == 1 + assert img.width == 256 + assert img.height == 256 + assert img.band_names == ["2022-01-01T00:00:00.000000000"] + assert img.dataset_statistics == ((arr.min(), arr.max()),) + + img = dst.part((-160, -80, 160, 80)) + assert img.count == 1 + assert img.band_names == ["2022-01-01T00:00:00.000000000"] + + pt = dst.point(0, 0) + assert pt.count == 1 + assert pt.band_names == ["2022-01-01T00:00:00.000000000"] + assert pt.coordinates + + feat = { + "type": "Feature", + "properties": {}, + "geometry": { + "type": "Polygon", + "coordinates": [ + [ + [-92.46093749999999, 72.91963546581484], + [-148.0078125, 33.137551192346145], + [-143.08593749999997, -28.613459424004414], + [43.9453125, -47.04018214480665], + [142.734375, -12.897489183755892], + [157.5, 68.13885164925573], + [58.71093750000001, 74.95939165894974], + [-40.42968749999999, 75.14077784070429], + [-92.46093749999999, 72.91963546581484], + ] + ], + }, + } + img = dst.feature(feat) + assert img.count == 1 + assert img.band_names == ["2022-01-01T00:00:00.000000000"] + + img = dst.feature(feat, dst_crs="epsg:3857") + assert img.count == 1 + assert img.band_names == ["2022-01-01T00:00:00.000000000"] + assert img.crs.to_epsg() == 3857 + print(img) diff --git a/tests/test_mask.py b/tests/test_mask.py index b86a8da6..8a6e4d96 100644 --- a/tests/test_mask.py +++ b/tests/test_mask.py @@ -8,7 +8,7 @@ from rasterio.coords import BoundingBox from rasterio.crs import CRS -from rio_tiler.io import COGReader +from rio_tiler.io import Reader tiles = { "masked": morecantile.Tile(x=535, y=498, z=10), @@ -43,20 +43,23 @@ def test_mask_bilinear(cloudoptimized_geotiff): src_path = cloudoptimized_geotiff( cog_path, **equator, dtype="uint8", nodata_type="alpha" ) - with COGReader(src_path) as cog: + with 
Reader(src_path) as cog: data, mask = cog.preview( resampling_method="bilinear", force_binary_mask=True, + max_size=100, ) masknodata = (data[0] != 0).astype(numpy.uint8) * 255 numpy.testing.assert_array_equal(mask, masknodata) - data, mask = cog.preview( + dataf, maskf = cog.preview( resampling_method="bilinear", force_binary_mask=False, + max_size=100, ) - masknodata = (data[0] != 0).astype(numpy.uint8) * 255 - assert not numpy.array_equal(mask, masknodata) + masknodata = (dataf[0] != 0).astype(numpy.uint8) * 255 + assert not numpy.array_equal(maskf, masknodata) + assert not numpy.array_equal(maskf, mask) @pytest.mark.parametrize("resampling", ["bilinear", "nearest"]) @@ -67,7 +70,7 @@ def test_mask(dataset_info, tile_name, resampling, cloudoptimized_geotiff): src_path = cloudoptimized_geotiff(cog_path, **dataset_info) tile = tiles[tile_name] - with COGReader(src_path) as cog: + with Reader(src_path) as cog: data, mask = cog.tile( tile.x, tile.y, diff --git a/tests/test_models.py b/tests/test_models.py index eea50727..2dd14c74 100644 --- a/tests/test_models.py +++ b/tests/test_models.py @@ -5,6 +5,7 @@ import numpy import pytest import rasterio +from rasterio.io import MemoryFile from rio_tiler.errors import InvalidDatatypeWarning from rio_tiler.models import ImageData @@ -121,3 +122,57 @@ def test_merge_with_diffsize(): img2 = ImageData(numpy.zeros((1, 256, 256))) img = ImageData.create_from_list([img1, img2]) assert len(w) == 0 + + +def test_apply_expression(): + """Apply expression""" + img = ImageData(numpy.zeros((2, 256, 256))) + img2 = img.apply_expression("b1+b2") + assert img.count == 2 + assert img.width == 256 + assert img.height == 256 + assert img.band_names == ["b1", "b2"] + assert img2.count == 1 + assert img2.width == 256 + assert img2.height == 256 + assert img2.band_names == ["b1+b2"] + + +def test_dataset_statistics(): + """Make statistics are preserved on expression""" + data = numpy.zeros((2, 256, 256), dtype="uint8") + data[0, 0:10, 0:10] = 0 
+ data[0, 10:11, 10:11] = 100 + data[1, 0:10, 0:10] = 100 + data[1, 10:11, 10:11] = 200 + img = ImageData(data, dataset_statistics=[(0, 100), (0, 200)]) + + img2 = img.apply_expression("b1+b2") + assert img2.dataset_statistics == [(0, 300)] + + img2 = img.apply_expression("b1+b2;b1*b2;b1/b1") + assert img2.dataset_statistics == [(0, 300), (0, 20000), (0, 1)] + assert img2.data[0].min() == 0 + assert img2.data[0].max() == 300 + assert img2.data[1].min() == 0 + assert img2.data[1].max() == 20000 + assert img2.data[2].min() == 0 + assert img2.data[2].max() == 1 + + data = numpy.zeros((1, 256, 256), dtype="int16") + data[0, 0:10, 0:10] = 0 + data[0, 10:11, 10:11] = 1 + + img = ImageData(data, dataset_statistics=[(0, 1)]).render(img_format="PNG") + with MemoryFile(img) as mem: + with mem.open() as dst: + arr = dst.read(indexes=1) + assert arr.min() == 0 + assert arr.max() == 255 + + img = ImageData(data).render(img_format="PNG") + with MemoryFile(img) as mem: + with mem.open() as dst: + arr = dst.read(indexes=1) + assert not arr.min() == 0 + assert not arr.max() == 255 diff --git a/tests/test_mosaic.py b/tests/test_mosaic.py index d2d76f39..8d5a3178 100644 --- a/tests/test_mosaic.py +++ b/tests/test_mosaic.py @@ -11,7 +11,7 @@ from rio_tiler import mosaic from rio_tiler.constants import WEB_MERCATOR_TMS, WGS84_CRS from rio_tiler.errors import EmptyMosaicError, InvalidMosaicMethod, TileOutsideBounds -from rio_tiler.io import COGReader, STACReader +from rio_tiler.io import Reader, STACReader from rio_tiler.models import ImageData from rio_tiler.mosaic.methods import defaults from rio_tiler.types import DataMaskType @@ -41,19 +41,19 @@ def _read_tile(src_path: str, *args, **kwargs) -> ImageData: """Read tile from an asset""" - with COGReader(src_path) as cog: + with Reader(src_path) as cog: return cog.tile(*args, **kwargs) def _read_part(src_path: str, *args, **kwargs) -> ImageData: """Read part from an asset""" - with COGReader(src_path) as cog: + with Reader(src_path) as 
cog: return cog.part(*args, **kwargs) def _read_preview(src_path: str, *args, **kwargs) -> DataMaskType: """Read preview from an asset""" - with COGReader(src_path) as cog: + with Reader(src_path) as cog: data, mask = cog.preview(*args, **kwargs) return data, mask @@ -69,10 +69,10 @@ def test_mosaic_tiler(): assert t.dtype == m.dtype img, _ = mosaic.mosaic_reader(assets, _read_tile, x, y, z) - assert img.band_names == ["1", "2", "3"] + assert img.band_names == ["b1", "b2", "b3"] img, _ = mosaic.mosaic_reader(assets, _read_tile, x, y, z, indexes=[1]) - assert img.band_names == ["1"] + assert img.band_names == ["b1"] img, _ = mosaic.mosaic_reader(assets, _read_tile, x, y, z, expression="b1*3") assert img.band_names == ["b1*3"] @@ -249,7 +249,7 @@ def mock_rasterio_open(asset): return rasterio.open(asset) -@patch("rio_tiler.io.cogeo.rasterio") +@patch("rio_tiler.io.rasterio.rasterio") def test_stac_mosaic_tiler(rio): """Test mosaic tiler with STACReader.""" rio.open = mock_rasterio_open @@ -281,7 +281,7 @@ def _reader(src_path: str, *args, **kwargs) -> ImageData: assets="green", threads=0, ) - assert img.band_names == ["green_1"] + assert img.band_names == ["green_b1"] img, _ = mosaic.mosaic_reader( [stac_asset], @@ -289,23 +289,11 @@ def _reader(src_path: str, *args, **kwargs) -> ImageData: 71, 102, 8, - assets=["green"], - asset_expression={"green": "b1*2"}, + expression="green_b1*2", threads=0, ) assert img.band_names == ["green_b1*2"] - img, _ = mosaic.mosaic_reader( - [stac_asset], - _reader, - 71, - 102, - 8, - expression="green*2", - threads=0, - ) - assert img.band_names == ["green*2"] - def test_mosaic_tiler_Stdev(): """Test Stdev mosaic methods.""" @@ -440,10 +428,10 @@ def test_mosaic_tiler_with_imageDataClass(): assert not img.bounds bbox = [-75.98703377413767, 44.93504283293786, -71.337604723999, 47.09685599202324] - with COGReader(assets[0]) as cog: + with Reader(assets[0]) as cog: crs1 = cog.dataset.crs - with COGReader(assets[0]) as cog: + with 
Reader(assets[0]) as cog: crs2 = cog.dataset.crs img, assets_used = mosaic.mosaic_reader( @@ -456,4 +444,5 @@ def test_mosaic_tiler_with_imageDataClass(): assert img.crs == crs1 == crs2 assert not img.bounds == bbox bbox_in_crs = transform_bounds(WGS84_CRS, crs1, *bbox, densify_pts=21) - assert img.bounds == bbox_in_crs + for xc, yc in zip(img.bounds, bbox_in_crs): + assert round(xc, 5) == round(yc, 5) diff --git a/tests/test_reader.py b/tests/test_reader.py index 4c1884f5..4e6bbe89 100644 --- a/tests/test_reader.py +++ b/tests/test_reader.py @@ -5,6 +5,7 @@ import numpy import pytest import rasterio +from rasterio.warp import transform_bounds from rio_tiler import constants, reader from rio_tiler.errors import PointOutsideBounds, TileOutsideBounds @@ -368,22 +369,253 @@ def test_tile_read_vrt_option(): def test_point(): """Read point values""" + with rasterio.open(COG) as src_dst: + pt = reader.point( + src_dst, + [-53.54620193828792, 73.28439084323475], + coord_crs="epsg:4326", + indexes=1, + nodata=1, + ) + assert pt.data == numpy.array([1]) + assert pt.mask == numpy.array([0]) + assert pt.band_names == ["b1"] + with rasterio.open(COG_SCALE) as src_dst: - p = reader.point(src_dst, [310000, 4100000], coord_crs=src_dst.crs, indexes=1) - assert p == [8917] + pt = reader.point(src_dst, [310000, 4100000], coord_crs=src_dst.crs, indexes=1) + assert pt.data == numpy.array([8917]) + assert pt.mask == numpy.array([255]) + assert pt.band_names == ["b1"] - p = reader.point(src_dst, [310000, 4100000], coord_crs=src_dst.crs) - assert p == [8917] + pt = reader.point(src_dst, [310000, 4100000], coord_crs=src_dst.crs) + assert pt.data == numpy.array([8917]) + assert pt.band_names == ["b1"] with pytest.raises(PointOutsideBounds): reader.point(src_dst, [810000, 4100000], coord_crs=src_dst.crs) - with rasterio.open(S3_MASK_PATH) as src_dst: - # Test with COG + internal mask - assert not reader.point(src_dst, [-104.7753105, 38.953548])[0] - assert reader.point(src_dst, 
[-104.7753105415, 38.953548], masked=False)[0] == 0 - with rasterio.open(S3_ALPHA_PATH) as src_dst: # Test with COG + Alpha Band - assert not reader.point(src_dst, [-104.77519499, 38.95367054])[0] - assert reader.point(src_dst, [-104.77519499, 38.95367054], masked=False)[0] == 0 + assert reader.point(src_dst, [-104.77519499, 38.95367054]).data[0] + assert ( + reader.point(src_dst, [-104.77519499, 38.95367054]).mask[0] == 0 + ) # Masked + + +def test_part_with_buffer(): + """Make sure buffer works as expected.""" + bounds = [ + -6574807.42497772, + 12210356.646387195, + -6261721.357121638, + 12523442.714243278, + ] + # Read part at full resolution + with rasterio.open(COG) as src_dst: + img_no_buffer = reader.part(src_dst, bounds, dst_crs=constants.WEB_MERCATOR_CRS) + + x_size = img_no_buffer.width + y_size = img_no_buffer.height + + x_res = (bounds[2] - bounds[0]) / x_size + y_res = (bounds[3] - bounds[1]) / y_size + + nx = x_size + 4 + ny = y_size + 4 + + # apply a 2 pixel buffer + bounds_with_buffer = ( + bounds[0] - x_res * 2, + bounds[1] - y_res * 2, + bounds[2] + x_res * 2, + bounds[3] + y_res * 2, + ) + with rasterio.open(COG) as src_dst: + img = reader.part( + src_dst, + bounds_with_buffer, + height=ny, + width=nx, + dst_crs=constants.WEB_MERCATOR_CRS, + ) + assert img.width == nx + assert img.height == ny + + with rasterio.open(COG) as src_dst: + imgb = reader.part( + src_dst, bounds, buffer=2, dst_crs=constants.WEB_MERCATOR_CRS + ) + assert imgb.width == nx + assert imgb.height == ny + + assert numpy.array_equal(img.data, imgb.data) + assert img.bounds == imgb.bounds + + # No resampling is involved. 
Because we read the full resolution data + # all arrays should be equal + numpy.array_equal(img_no_buffer.data, imgb.data[:, 2:-2, 2:-2]) + numpy.array_equal(img_no_buffer.data, img.data[:, 2:-2, 2:-2]) + + +def test_read(): + """Test reader.read function.""" + with rasterio.open(COG) as src: + img = reader.read(src) + assert img.width == src.width + assert img.height == src.height + assert img.count == src.count + assert img.bounds == src.bounds + assert img.crs == src.crs + + with rasterio.open(COG) as src: + with pytest.warns(UserWarning): + img = reader.read(src, max_size=1000, width=100, height=100) + assert img.width == 100 + assert img.height == 100 + assert img.count == src.count + assert img.bounds == src.bounds + assert img.crs == src.crs + + with rasterio.open(COG) as src: + img = reader.read(src, width=100, height=100) + assert img.width == 100 + assert img.height == 100 + assert img.count == src.count + assert img.bounds == src.bounds + assert img.crs == src.crs + + with rasterio.open(COG) as src: + img = reader.read(src, max_size=100) + assert max(img.width, img.height) == 100 + assert img.count == src.count + assert img.bounds == src.bounds + assert img.crs == src.crs + + with rasterio.open(COG) as src: + img = reader.read(src, dst_crs="epsg:3857") + assert not img.width == src.width + assert not img.height == src.height + assert img.count == src.count + assert not img.bounds == src.bounds + assert not img.crs == src.crs + + with rasterio.open(COG) as src: + img = reader.read(src) + assert img.mask.all() + + with rasterio.open(COG) as src: + img = reader.read(src, nodata=1) + assert not img.mask.all() + + with rasterio.open(COG) as src: + img = reader.read(src, window=((0, 100), (0, 100))) + assert img.width == 100 + assert img.height == 100 + assert img.count == src.count + assert not img.bounds == src.bounds + assert img.crs == src.crs + + # Boundless Read + with rasterio.open(COG) as src: + img = reader.read(src, window=((-10, 100), (-10, 100))) + 
assert img.width == 110 + assert img.height == 110 + assert img.count == src.count + assert not img.bounds == src.bounds + assert img.crs == src.crs + + with rasterio.open(COG) as src: + img = reader.read(src, window=((0, 4000), (0, 4000))) + assert img.width == 4000 + assert img.height == 4000 + assert img.count == src.count + assert not img.bounds == src.bounds + assert img.crs == src.crs + + # Can't use boundless window with WarpedVRT + with rasterio.open(COG) as src: + with pytest.raises(ValueError): + reader.read(src, window=((0, 4000), (0, 4000)), dst_crs="epsg:3857") + + # Unscale Dataset + with rasterio.open(COG_SCALE) as src: + assert not src.dtypes[0] == numpy.float32 + img = reader.read(src, unscale=True) + assert img.data.dtype == numpy.float32 + + # Dataset with Alpha using WarpedVRT + with rasterio.open(S3_ALPHA_PATH) as src: + img = reader.read(src, dst_crs="epsg:3857") + assert not img.mask.all() + + +def test_part_no_VRT(): + """Test reader.part function without VRT.""" + bounds = [ + -56.6015625, + 73.0001215118412, + -51.67968749999999, + 74.23886253330774, + ] # boundless part + # Read part at full resolution + with rasterio.open(COG) as src_dst: + + bounds_dst_crs = transform_bounds( + "epsg:4326", src_dst.crs, *bounds, densify_pts=21 + ) + + img = reader.part(src_dst, bounds, bounds_crs="epsg:4326") + assert img.height == 1453 + assert img.width == 1613 + assert img.mask[0, 0] == 255 + assert img.mask[-1, -1] == 0 # boundless + assert img.bounds == bounds_dst_crs + + # Use bbox in Image CRS + img_crs = reader.part(src_dst, bounds_dst_crs) + assert img.height == 1453 + assert img.width == 1613 + assert img_crs.mask[0, 0] == 255 + assert img_crs.mask[-1, -1] == 0 # boundless + assert img.bounds == bounds_dst_crs + + # MaxSize + img = reader.part(src_dst, bounds, bounds_crs="epsg:4326", max_size=1024) + assert img.height < 1024 + assert img.width == 1024 + assert img.mask[0, 0] == 255 + assert img.mask[-1, -1] == 0 # boundless + assert img.bounds 
== bounds_dst_crs + + # Width/Height + img = reader.part( + src_dst, + bounds, + bounds_crs="epsg:4326", + width=100, + height=100, + ) + assert img.height == 100 + assert img.width == 100 + assert img.mask[0, 0] == 255 + assert img.mask[-1, -1] == 0 # boundless + assert img.bounds == bounds_dst_crs + + # Buffer + img = reader.part(src_dst, bounds, bounds_crs="epsg:4326", buffer=1) + assert img.height == 1455 + assert img.width == 1615 + assert img.mask[0, 0] == 255 + assert img.mask[-1, -1] == 0 # boundless + assert not img.bounds == bounds_dst_crs + + # Padding + img = reader.part(src_dst, bounds, bounds_crs="epsg:4326") + img_pad = reader.part(src_dst, bounds, bounds_crs="epsg:4326", padding=1) + assert img_pad.height == 1453 + assert img_pad.width == 1613 + assert img_pad.mask[0, 0] == 255 + assert img_pad.mask[-1, -1] == 0 # boundless + assert img_pad.bounds == bounds_dst_crs + # Padding should not have any influence when not doing any rescaling/reprojection + numpy.array_equal(img_pad.data, img.data) diff --git a/tests/test_utils.py b/tests/test_utils.py index 7730023f..d125a900 100644 --- a/tests/test_utils.py +++ b/tests/test_utils.py @@ -13,7 +13,7 @@ from rio_tiler.constants import WEB_MERCATOR_TMS, WGS84_CRS from rio_tiler.errors import RioTilerError from rio_tiler.expression import parse_expression -from rio_tiler.io import COGReader +from rio_tiler.io import Reader from .conftest import requires_webp @@ -163,25 +163,17 @@ def test_aligned_with_internaltile(): """Check if COG is in WebMercator and aligned with internal tiles.""" bounds = WEB_MERCATOR_TMS.bounds(43, 25, 7) with rasterio.open(COG_DST) as src_dst: - assert not utils._requested_tile_aligned_with_internal_tile( - src_dst, bounds, 256, 256 - ) + assert not utils._requested_tile_aligned_with_internal_tile(src_dst, bounds) with rasterio.open(NOCOG) as src_dst: - assert not utils._requested_tile_aligned_with_internal_tile( - src_dst, bounds, 256, 256 - ) + assert not 
utils._requested_tile_aligned_with_internal_tile(src_dst, bounds) bounds = WEB_MERCATOR_TMS.bounds(147, 182, 9) with rasterio.open(COG_NOWEB) as src_dst: - assert not utils._requested_tile_aligned_with_internal_tile( - src_dst, bounds, 256, 256 - ) + assert not utils._requested_tile_aligned_with_internal_tile(src_dst, bounds) with rasterio.open(COG_WEB_TILED) as src_dst: - assert utils._requested_tile_aligned_with_internal_tile( - src_dst, bounds, 256, 256 - ) + assert utils._requested_tile_aligned_with_internal_tile(src_dst, bounds) def test_find_non_alpha(): @@ -289,7 +281,7 @@ def test_cutline(): feature_bounds = featureBounds(feat) - with COGReader(COGEO) as cog: + with Reader(COGEO) as cog: cutline = utils.create_cutline(cog.dataset, feat, geometry_crs="epsg:4326") data, mask = cog.part(feature_bounds, vrt_options={"cutline": cutline}) assert not mask.all() @@ -314,7 +306,7 @@ def test_cutline(): }, } - with COGReader(COGEO) as cog: + with Reader(COGEO) as cog: with pytest.raises(RioTilerError): utils.create_cutline(cog.dataset, feat_line, geometry_crs="epsg:4326") @@ -342,7 +334,7 @@ def test_cutline(): ], } - with COGReader(COGEO) as cog: + with Reader(COGEO) as cog: c = utils.create_cutline(cog.dataset, feat_mp, geometry_crs="epsg:4326") assert "MULTIPOLYGON" in c @@ -361,7 +353,7 @@ def test_cutline(): ], } - with COGReader(COGEO) as cog: + with Reader(COGEO) as cog: with pytest.raises(RioTilerError): utils.create_cutline(cog.dataset, bad_poly, geometry_crs="epsg:4326")