diff --git a/ci/dev.yaml b/ci/dev.yaml index 56ffe61..fd01e26 100644 --- a/ci/dev.yaml +++ b/ci/dev.yaml @@ -7,6 +7,7 @@ dependencies: # to build from source - cython - geos + - proj # testing - pytest - pytest-cov @@ -16,3 +17,4 @@ dependencies: - pip: - git+https://github.com/shapely/shapely.git@main - git+https://github.com/pydata/xarray.git@main + - git+https://github.com/pyproj4/pyproj.git diff --git a/ci/latest.yaml b/ci/latest.yaml index 9f113f4..e57ad60 100644 --- a/ci/latest.yaml +++ b/ci/latest.yaml @@ -7,6 +7,7 @@ dependencies: # required - shapely=2 - xarray + - pyproj # testing - pytest - pytest-cov diff --git a/doc/source/api.rst b/doc/source/api.rst index 0d27ae4..a16af19 100644 --- a/doc/source/api.rst +++ b/doc/source/api.rst @@ -4,6 +4,9 @@ API reference ============= +The API reference provides an overview of all public objects, functions and +methods and Xarray accessors implemented in Xvec. + Indexing -------- @@ -15,3 +18,65 @@ Indexing GeometryIndex GeometryIndex.crs GeometryIndex.sindex + + +.. currentmodule:: xarray + +Dataset.xvec +------------ + +.. _dsattr: + +Properties +~~~~~~~~~~ + +.. autosummary:: + :toctree: generated/ + :template: autosummary/accessor_attribute.rst + + Dataset.xvec.geom_coords + Dataset.xvec.geom_coords_indexed + + +.. _dsmeth: + +Methods +~~~~~~~ + +.. autosummary:: + :toctree: generated/ + :template: autosummary/accessor_method.rst + + Dataset.xvec.is_geom_variable + Dataset.xvec.set_crs + Dataset.xvec.to_crs + + +DataArray.xvec +-------------- + +.. _daattr: + +Properties +~~~~~~~~~~ + +.. autosummary:: + :toctree: generated/ + :template: autosummary/accessor_attribute.rst + + DataArray.xvec.geom_coords + DataArray.xvec.geom_coords_indexed + + +.. _dameth: + +Methods +~~~~~~~ + +.. autosummary:: + :toctree: generated/ + :template: autosummary/accessor_method.rst + + DataArray.xvec.is_geom_variable + DataArray.xvec.to_crs + DataArray.xvec.set_crs \ No newline at end of file diff --git a/doc/source/conf.py b/doc/source/conf.py index a49b0da..380a47a 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -5,6 +5,15 @@ # -- Project information ----------------------------------------------------- # https://www.sphinx-doc.org/en/master/usage/configuration.html#project-information +import os +import sys + +import sphinx_autosummary_accessors + + +sys.path.insert(0, os.path.abspath("../xvec/")) + +import xvec # noqa project = "Xvec" copyright = "2022, Xvec developers" @@ -20,9 +29,13 @@ "sphinx.ext.intersphinx", "myst_nb", "sphinx_copybutton", + "sphinx_autosummary_accessors", ] -templates_path = ["_templates"] +templates_path = [ + "_templates", + sphinx_autosummary_accessors.templates_path, +] exclude_patterns = [] intersphinx_mapping = { @@ -42,3 +55,4 @@ "github_url": "https://github.com/martinfleis/xvec", } nb_execution_mode = "off" +autodoc_typehints = "none" diff --git a/environment.yml b/environment.yml index 6968c44..bd8ddf3 100644 --- a/environment.yml +++ b/environment.yml @@ -22,3 +22,6 @@ dependencies: - flake8 - black - isort + - pip + - pip: + - sphinx_autosummary_accessors diff --git a/pyproject.toml b/pyproject.toml index 1333517..c97c6fb 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -27,7 +27,7 @@ classifiers = [ ] requires-python = ">=3.8" dependencies = [ - "xarray >= 2022.11.0", + "xarray >= 2022.12.0", "pyproj >= 3.0.0", "shapely >= 2.0b1", ] diff --git a/xvec/__init__.py b/xvec/__init__.py index 15ad2cb..44c022b 100644 --- a/xvec/__init__.py +++ b/xvec/__init__.py @@ -1,5 +1,6 @@ from importlib.metadata import PackageNotFoundError, version +from .accessor import XvecAccessor # noqa from .index import GeometryIndex # noqa try: diff --git a/xvec/accessor.py b/xvec/accessor.py new file mode 100644 index 0000000..43f18d5 --- /dev/null +++ b/xvec/accessor.py @@ -0,0 +1,496 @@ +from typing import Any, Hashable, Mapping, Union + +import numpy as np +import shapely +import xarray as xr +from pyproj import CRS, Transformer + +from .index import GeometryIndex + + +@xr.register_dataarray_accessor("xvec") +@xr.register_dataset_accessor("xvec") +class XvecAccessor: + """Access geometry-based methods for DataArrays and Datasets with Shapely geometry. + + Currently works on coordinates with :class:`xvec.GeometryIndex`. + """ + + def __init__(self, xarray_obj: Union[xr.Dataset, xr.DataArray]): + """xvec init, nothing to be done here.""" + self._obj = xarray_obj + self._geom_coords_all = [ + name + for name in self._obj.coords + if self.is_geom_variable(name, has_index=False) + ] + self._geom_indexes = [ + name + for name in self._obj.coords + if self.is_geom_variable(name, has_index=True) + ] + + def is_geom_variable(self, name: Hashable, has_index: bool = True): + """Check if coordinate variable is composed of :class:`shapely.Geometry`. + + Can return all such variables or only those using :class:`~xvec.GeometryIndex`. + + Parameters + ---------- + name : coordinate variable name + has_index : bool, optional + control if all variables are returned (``False``) or only those that have + :class:`xvec.GeometryIndex` assigned (``True``). By default ``False`` + + Returns + ------- + bool + + Examples + -------- + + >>> ds = ( + ... xr.Dataset( + ... coords={ + ... "geom": np.array([shapely.Point(1, 2), shapely.Point(3, 4)]), + ... "geom2": np.array([shapely.Point(1, 2), shapely.Point(3, 4)]), + ... "foo": np.array([1, 2]), + ... } + ... ) + ... .drop_indexes(["geom"]) + ... .set_xindex("geom", xvec.GeometryIndex, crs=26915) + ... ) + >>> ds + + Dimensions: (geom: 2, geom2: 2, foo: 2) + Coordinates: + * geom (geom) object POINT (1 2) POINT (3 4) + * geom2 (geom2) object POINT (1 2) POINT (3 4) + * foo (foo) int64 1 2 + Data variables: + *empty* + Indexes: + geom GeometryIndex (crs=EPSG:26915) + >>> ds.xvec.is_geom_variable("geom") + True + >>> ds.xvec.is_geom_variable("foo") + False + >>> ds.xvec.is_geom_variable("geom2") + False + >>> ds.xvec.is_geom_variable("geom2", has_index=False) + True + + See also + -------- + geom_coords + geom_coords_indexed + """ + if isinstance(self._obj.xindexes.get(name), GeometryIndex): + return True + if not has_index: + if self._obj[name].dtype is np.dtype("O"): + # try first on a small subset + subset = self._obj[name].data[0:10] + if np.all(shapely.is_valid_input(subset)): + return np.all(shapely.is_valid_input(self._obj[name].data)) + return False + + @property + def geom_coords(self) -> Mapping[Hashable, xr.DataArray]: + """Returns a dictionary of xarray.DataArray objects corresponding to + coordinate variables composed of :class:`shapely.Geometry` objects. + + Examples + -------- + >>> ds = ( + ... xr.Dataset( + ... coords={ + ... "geom": np.array([shapely.Point(1, 2), shapely.Point(3, 4)]), + ... "geom_z": np.array( + ... [shapely.Point(10, 20, 30), shapely.Point(30, 40, 50)] + ... ), + ... "geom_no_index": np.array( + ... [shapely.Point(1, 2), shapely.Point(3, 4)] + ... ), + ... } + ... ) + ... .drop_indexes(["geom", "geom_z"]) + ... .set_xindex("geom", xvec.GeometryIndex, crs=26915) + ... .set_xindex("geom_z", xvec.GeometryIndex, crs=26915) + ... ) + >>> ds + + Dimensions: (geom: 2, geom_z: 2, geom_no_index: 2) + Coordinates: + * geom (geom) object POINT (1 2) POINT (3 4) + * geom_z (geom_z) object POINT Z (10 20 30) POINT Z (30 40 50) + * geom_no_index (geom_no_index) object POINT (1 2) POINT (3 4) + Data variables: + *empty* + Indexes: + geom GeometryIndex (crs=EPSG:26915) + geom_z GeometryIndex (crs=EPSG:26915) + >>> ds.xvec.geom_coords + Coordinates: + * geom (geom) object POINT (1 2) POINT (3 4) + * geom_z (geom_z) object POINT Z (10 20 30) POINT Z (30 40 50) + * geom_no_index (geom_no_index) object POINT (1 2) POINT (3 4) + + See also + -------- + geom_coords_indexed + is_geom_variable + """ + return self._obj[self._geom_coords_all].coords + + @property + def geom_coords_indexed(self) -> Mapping[Hashable, xr.DataArray]: + """Returns a dictionary of xarray.DataArray objects corresponding to + coordinate variables using :class:`~xvec.GeometryIndex`. + + Examples + -------- + >>> ds = ( + ... xr.Dataset( + ... coords={ + ... "geom": np.array([shapely.Point(1, 2), shapely.Point(3, 4)]), + ... "geom_z": np.array( + ... [shapely.Point(10, 20, 30), shapely.Point(30, 40, 50)] + ... ), + ... "geom_no_index": np.array( + ... [shapely.Point(1, 2), shapely.Point(3, 4)] + ... ), + ... } + ... ) + ... .drop_indexes(["geom", "geom_z"]) + ... .set_xindex("geom", xvec.GeometryIndex, crs=26915) + ... .set_xindex("geom_z", xvec.GeometryIndex, crs=26915) + ... ) + >>> ds + + Dimensions: (geom: 2, geom_z: 2, geom_no_index: 2) + Coordinates: + * geom (geom) object POINT (1 2) POINT (3 4) + * geom_z (geom_z) object POINT Z (10 20 30) POINT Z (30 40 50) + * geom_no_index (geom_no_index) object POINT (1 2) POINT (3 4) + Data variables: + *empty* + Indexes: + geom GeometryIndex (crs=EPSG:26915) + geom_z GeometryIndex (crs=EPSG:26915) + >>> ds.xvec.geom_coords_indexed + >>> ds.xvec.geom_coords_indexed + Coordinates: + * geom (geom) object POINT (1 2) POINT (3 4) + * geom_z (geom_z) object POINT Z (10 20 30) POINT Z (30 40 50) + + See also + -------- + geom_coords + is_geom_variable + + """ + return self._obj[self._geom_indexes].coords + + def to_crs( + self, + variable_crs: Mapping[Any, Any] | None = None, + **variable_crs_kwargs: Any, + ): + """ + Transform :class:`shapely.Geometry` objects of a variable to a new coordinate + reference system. + + Returns a new object with all the original data in addition to the transformed + variable. The CRS the current array must be set using + :class:`~xvec.GeometryIndex`. + + This method will transform all points in all objects. It has no notion or + projecting entire geometries. All segments joining points are assumed to be + lines in the current projection, not geodesics. Objects crossing the dateline + (or other projection boundary) will have undesirable behavior. + + Parameters + ---------- + variable_crs : dict-like or None, optional + A dict where the keys are the names of the coordinates and values target + CRS in any format accepted by + :meth:`pyproj.CRS.from_user_input() ` such + as an authority string (e.g. ``"EPSG:4326"``), EPSG code (e.g. ``4326``) or + a WKT string. + **variable_crs_kwargs : optional + The keyword arguments form of ``variable_crs``. + One of ``variable_crs`` or ``variable_crs_kwargs`` must be provided. + + Returns + ------- + assigned : same type as caller + A new object with the variables transformed to target CRSs. + + See also + -------- + set_crs + + Examples + -------- + Transform coordinates backed by :class:`~xvec.GeometryIndex` from `EPSG:4326` + to `ESPG:3857`. + + >>> da = ( + ... xr.DataArray( + ... np.random.rand(2), + ... coords={"geom": [shapely.Point(1, 2), shapely.Point(3, 4)]}, + ... dims="geom", + ... ) + ... .drop_indexes("geom") + ... .set_xindex("geom", xvec.GeometryIndex, crs=4326) + ... ) + >>> da + + array([0.47575118, 0.09271935]) + Coordinates: + * geom (geom) object POINT (1 2) POINT (3 4) + Indexes: + geom GeometryIndex (crs=EPSG:4326) + >>> da.xvec.to_crs(geom=3857) + + array([0.47575118, 0.09271935]) + Coordinates: + * geom (geom) object POINT (111319.49079327357 222684.20850554405) POIN... + Indexes: + geom GeometryIndex (crs=EPSG:3857) + + The same can be done using dictionary arguments. + + >>> da.xvec.to_crs({"geom": 3857}) + + array([0.47575118, 0.09271935]) + Coordinates: + * geom (geom) object POINT (111319.49079327357 222684.20850554405) POIN... + Indexes: + geom GeometryIndex (crs=EPSG:3857) + + The same applies to a :class:`xarray.Dataset`. + + >>> ds = ( + ... xr.Dataset(coords={"geom": [shapely.Point(1, 2), shapely.Point(3, 4)]}) + ... .drop_indexes("geom") + ... .set_xindex("geom", xvec.GeometryIndex, crs=4326) + ... ) + >>> ds + + Dimensions: (geom: 2) + Coordinates: + * geom (geom) object POINT (1 2) POINT (3 4) + Data variables: + *empty* + Indexes: + geom GeometryIndex (crs=EPSG:4326) + >>> ds.xvec.to_crs(geom=3857) + + Dimensions: (geom: 2) + Coordinates: + * geom (geom) object POINT (111319.49079327357 222684.20850554405) POIN... + Data variables: + *empty* + Indexes: + geom GeometryIndex (crs=EPSG:3857) + + Notes + ----- + Currently supports only :class:`xarray.Variable` objects that are set as + coordinates with :class:`~xvec.GeometryIndex` assigned. The implementation + currently wraps :meth:`Dataset.assign_coords ` + or :meth:`DataArray.assign_coords `. + """ + if variable_crs and variable_crs_kwargs: + raise ValueError( + "Cannot specify both keyword and positional arguments to " + "'.xvec.to_crs'." + ) + + _obj = self._obj.copy(deep=False) + + if variable_crs_kwargs: + variable_crs = variable_crs_kwargs + + transformed = {} + + for key, crs in variable_crs.items(): + + data = _obj[key] + data_crs = self._obj.xindexes[key].crs + + # transformation code taken from geopandas (BSD 3-clause license) + if data_crs is None: + raise ValueError( + "Cannot transform naive geometries. " + f"Please set a CRS on the '{key}' coordinates first." + ) + + crs = CRS.from_user_input(crs) + + if data_crs.is_exact_same(crs): + pass + + transformer = Transformer.from_crs(data_crs, crs, always_xy=True) + + has_z = shapely.has_z(data) + + result = np.empty_like(data) + + coordinates = shapely.get_coordinates(data[~has_z], include_z=False) + new_coords = transformer.transform(coordinates[:, 0], coordinates[:, 1]) + result[~has_z] = shapely.set_coordinates( + data[~has_z].copy(), np.array(new_coords).T + ) + + coords_z = shapely.get_coordinates(data[has_z], include_z=True) + new_coords_z = transformer.transform( + coords_z[:, 0], coords_z[:, 1], coords_z[:, 2] + ) + result[has_z] = shapely.set_coordinates( + data[has_z].copy(), np.array(new_coords_z).T + ) + + transformed[key] = (result, crs) + + for key, (result, crs) in transformed.items(): + _obj = _obj.assign_coords({key: result}) + + _obj = _obj.drop_indexes(variable_crs.keys()) + + for key, crs in variable_crs.items(): + _obj = _obj.set_xindex(key, GeometryIndex, crs=crs) + + return _obj + + def set_crs( + self, + variable_crs: Mapping[Any, Any] | None = None, + allow_override=False, + **variable_crs_kwargs: Any, + ): + """Set the Coordinate Reference System (CRS) of coordinates backed by + :class:`~xvec.GeometryIndex`. + + Parameters + ---------- + variable_crs : dict-like or None, optional + A dict where the keys are the names of the coordinates and values target + CRS in any format accepted by + :meth:`pyproj.CRS.from_user_input() ` such + as an authority string (e.g. ``"EPSG:4326"``), EPSG code (e.g. ``4326``) or + a WKT string. + allow_override : bool, default False + If the the :class:`~xvec.GeometryIndex` already has a CRS, + allow to replace the existing CRS, even when both are not equal. + **variable_crs_kwargs : optional + The keyword arguments form of ``variable_crs``. + One of ``variable_crs`` or ``variable_crs_kwargs`` must be provided. + + Returns + ------- + assigned : same type as caller + A new object with the assigned target CRS. + + See also + -------- + to_crs + + Examples + -------- + The method is the most useful, when there is no CRS assigned (illustrated on + a :class:`xarray.Dataset` but the same is applicable on + a :class:`xarray.DataArray`). + + >>> ds = ( + ... xr.Dataset(coords={"geom": [shapely.Point(1, 2), shapely.Point(3, 4)]}) + ... .drop_indexes("geom") + ... .set_xindex("geom", xvec.GeometryIndex) + ... ) + >>> ds + + Dimensions: (geom: 2) + Coordinates: + * geom (geom) object POINT (1 2) POINT (3 4) + Data variables: + *empty* + Indexes: + geom GeometryIndex (crs=None) + >>> ds.xvec.set_crs(geom=4326) + + Dimensions: (geom: 2) + Coordinates: + * geom (geom) object POINT (1 2) POINT (3 4) + Data variables: + *empty* + Indexes: + geom GeometryIndex (crs=EPSG:4326) + + It can also be used to overwrite the existing CRS. Note, that in most cases + you probably want to use the :meth:`to_crs` instead is such a case. + + >>> ds = ( + ... xr.Dataset(coords={"geom": [shapely.Point(1, 2), shapely.Point(3, 4)]}) + ... .drop_indexes("geom") + ... .set_xindex("geom", xvec.GeometryIndex, crs=4326) + ... ) + >>> ds + + Dimensions: (geom: 2) + Coordinates: + * geom (geom) object POINT (1 2) POINT (3 4) + Data variables: + *empty* + Indexes: + geom GeometryIndex (crs=EPSG:4326) + >>> ds.xvec.set_crs(geom=3857, allow_override=True) + + Dimensions: (geom: 2) + Coordinates: + * geom (geom) object POINT (1 2) POINT (3 4) + Data variables: + *empty* + Indexes: + geom GeometryIndex (crs=EPSG:3857) + + See that only the CRS has changed, not the geometries. + + + Notes + ----- + The underlying geometries are not transformed to this CRS. To + transform the geometries to a new CRS, use the :meth:`to_crs` + method. + """ + + if variable_crs and variable_crs_kwargs: + raise ValueError( + "Cannot specify both keyword and positional arguments to " + ".xvec.set_crs." + ) + + _obj = self._obj.copy(deep=False) + + if variable_crs_kwargs: + variable_crs = variable_crs_kwargs + + for key, crs in variable_crs.items(): + + data_crs = self._obj.xindexes[key].crs + + if not allow_override and data_crs is not None and not data_crs == crs: + raise ValueError( + f"The index '{key}' already has a CRS which is not equal to the " + "passed CRS. Specify 'allow_override=True' to allow replacing the " + "existing CRS without doing any transformation. If you actually " + "want to transform the geometries, use '.xvec.to_crs' instead." + ) + + _obj = _obj.drop_indexes(variable_crs.keys()) + + for key, crs in variable_crs.items(): + _obj = _obj.set_xindex(key, GeometryIndex, crs=crs) + + return _obj diff --git a/xvec/tests/conftest.py b/xvec/tests/conftest.py new file mode 100644 index 0000000..c3e6455 --- /dev/null +++ b/xvec/tests/conftest.py @@ -0,0 +1,92 @@ +import numpy as np +import pytest +import shapely +import xarray as xr +from pyproj import CRS + +from xvec import GeometryIndex + + +@pytest.fixture(scope="session") +def geom_array(): + return np.array([shapely.Point(1, 2), shapely.Point(3, 4)]) + + +@pytest.fixture(scope="session") +def geom_array_z(): + return np.array([shapely.Point(10, 20, 30), shapely.Point(30, 40, 50)]) + + +@pytest.fixture(scope="session") +def geom_dataset_no_index(geom_array): + # a dataset with a geometry coordinate but no index + ds = xr.Dataset(coords={"geom": geom_array}) + return ds.drop_indexes("geom") + + +@pytest.fixture(scope="session") +def geom_dataset(geom_dataset_no_index): + # a dataset with a geometry coordinate baked by a GeometryIndex + crs = CRS.from_user_input(26915) + return geom_dataset_no_index.set_xindex("geom", GeometryIndex, crs=crs) + + +@pytest.fixture(scope="session") +def geom_dataset_no_crs(geom_dataset_no_index): + # a dataset with a geometry coordinate baked by a GeometryIndex (no CRS) + return geom_dataset_no_index.set_xindex("geom", GeometryIndex) + + +@pytest.fixture(scope="session") +def first_geom_dataset(geom_dataset, geom_array): + return ( + xr.Dataset(coords={"geom": [geom_array[0]]}) + .drop_indexes("geom") + .set_xindex("geom", GeometryIndex, crs=geom_dataset.xindexes["geom"].crs) + ) + + +@pytest.fixture(scope="session") +def multi_geom_dataset(geom_array, geom_array_z): + return ( + xr.Dataset( + coords={ + "geom": geom_array, + "geom_z": geom_array_z, + } + ) + .drop_indexes(["geom", "geom_z"]) + .set_xindex("geom", GeometryIndex, crs=26915) + .set_xindex("geom_z", GeometryIndex, crs=26915) + ) + + +@pytest.fixture(scope="session") +def multi_geom_no_index_dataset(geom_array, geom_array_z): + return ( + xr.Dataset( + coords={ + "geom": geom_array, + "geom_z": geom_array_z, + "geom_no_ix": geom_array, + } + ) + .drop_indexes(["geom", "geom_z"]) + .set_xindex("geom", GeometryIndex, crs=26915) + .set_xindex("geom_z", GeometryIndex, crs=26915) + ) + + +@pytest.fixture(scope="session") +def multi_geom_one_ix_foo(geom_array): + return ( + xr.Dataset( + coords={ + "geom": geom_array, + "geom2": geom_array, + "foo": np.array([1, 2]), + } + ) + .drop_indexes(["geom"]) + .set_xindex("geom", GeometryIndex, crs=26915) + ) diff --git a/xvec/tests/test_accessor.py b/xvec/tests/test_accessor.py new file mode 100644 index 0000000..14e3b86 --- /dev/null +++ b/xvec/tests/test_accessor.py @@ -0,0 +1,189 @@ +import numpy as np +import pytest +import shapely +import xarray as xr + +import xvec # noqa +from xvec import GeometryIndex + + +@pytest.fixture() +def geom_array_4326(): + return shapely.from_wkt( + ["POINT (-97.488735 0.000018)", "POINT (-97.488717 0.000036)"] + ) + + +@pytest.fixture() +def geom_array_z_4326(): + return shapely.from_wkt( + ["POINT Z (-97.488654 0.00018 30)", "POINT Z (-97.488475 0.000361 50)"] + ) + + +@pytest.fixture() +def mixed_geom_dims_dataset(geom_array, geom_array_z): + return ( + xr.Dataset(coords={"geom": np.concatenate([geom_array, geom_array_z])}) + .drop_indexes("geom") + .set_xindex("geom", GeometryIndex, crs=26915) + ) + + +@pytest.fixture() +def geom_array_mixed_4326(geom_array_4326, geom_array_z_4326): + return np.concatenate([geom_array_4326, geom_array_z_4326]) + + +# Test .xvec accessor + + +def test_accessor(multi_geom_dataset): + assert hasattr(multi_geom_dataset, "xvec") + xr.testing.assert_identical(multi_geom_dataset.xvec._obj, multi_geom_dataset) + + +# Test .xvec geom_coords + + +def test_geom_coords(multi_geom_no_index_dataset): + assert multi_geom_no_index_dataset.xvec._geom_coords_all == [ + "geom", + "geom_z", + "geom_no_ix", + ] + + actual = multi_geom_no_index_dataset.xvec.geom_coords + expected = multi_geom_no_index_dataset.coords + actual.keys() == expected.keys() + + # check assignment + with pytest.raises(AttributeError): + multi_geom_no_index_dataset.xvec.geom_coords = ( + multi_geom_no_index_dataset.coords + ) + + +def test_geom_coords_indexed(multi_geom_no_index_dataset): + assert multi_geom_no_index_dataset.xvec._geom_indexes == ["geom", "geom_z"] + + actual = multi_geom_no_index_dataset.xvec.geom_coords_indexed + expected = multi_geom_no_index_dataset.coords + actual.keys() == expected.keys() + + # check assignment + with pytest.raises(AttributeError): + multi_geom_no_index_dataset.xvec.geom_coords = ( + multi_geom_no_index_dataset.coords + ) + + +# Test .xvec.is_geom_variable +@pytest.mark.parametrize( + "label,has_index,expected", + [ + ("geom", True, True), + ("geom", False, True), + ("geom2", True, False), + ("geom2", False, True), + ("foo", True, False), + ("foo", False, False), + ], +) +def test_is_geom_variable(multi_geom_one_ix_foo, label, has_index, expected): + assert ( + multi_geom_one_ix_foo.xvec.is_geom_variable(label, has_index=has_index) + == expected + ) + + +# Test .xvec.to_crs + + +def test_to_crs(geom_dataset, geom_array_4326): + transformed = geom_dataset.xvec.to_crs(geom=4326) + assert shapely.equals_exact(geom_array_4326, transformed.geom, tolerance=1e-5).all() + assert transformed.xindexes["geom"].crs.equals(4326) + + +def test_to_crs_two_geoms(multi_geom_dataset, geom_array_4326, geom_array_z_4326): + transformed = multi_geom_dataset.xvec.to_crs(geom=4326, geom_z=4326) + assert shapely.equals_exact(geom_array_4326, transformed.geom, tolerance=1e-5).all() + assert shapely.equals_exact( + geom_array_z_4326, transformed.geom_z, tolerance=1e-5 + ).all() + assert transformed.xindexes["geom"].crs.equals(4326) + assert transformed.xindexes["geom_z"].crs.equals(4326) + + +def test_to_crs_dict(multi_geom_dataset, geom_array_4326, geom_array_z_4326): + transformed = multi_geom_dataset.xvec.to_crs({"geom": 4326, "geom_z": 4326}) + assert shapely.equals_exact(geom_array_4326, transformed.geom, tolerance=1e-5).all() + assert shapely.equals_exact( + geom_array_z_4326, transformed.geom_z, tolerance=1e-5 + ).all() + assert transformed.xindexes["geom"].crs.equals(4326) + assert transformed.xindexes["geom_z"].crs.equals(4326) + + +def test_to_crs_arg_err(multi_geom_dataset): + with pytest.raises(ValueError, match="Cannot specify both keyword"): + multi_geom_dataset.xvec.to_crs(geom=4326, variable_crs={"geom_z": 4326}) + + +def test_to_crs_naive(geom_dataset_no_crs): + with pytest.raises(ValueError, match="Cannot transform naive geometries."): + geom_dataset_no_crs.xvec.to_crs(geom=4326) + + +def test_to_crs_same(geom_dataset): + transformed = geom_dataset.xvec.to_crs(geom=26915) + xr.testing.assert_identical(transformed, geom_dataset) + + +def test_to_crs_mixed_geom_dims(mixed_geom_dims_dataset, geom_array_mixed_4326): + transformed = mixed_geom_dims_dataset.xvec.to_crs(geom=4326) + assert shapely.equals_exact( + geom_array_mixed_4326, transformed.geom, tolerance=1e-5 + ).all() + assert transformed.xindexes["geom"].crs.equals(4326) + + +# Test .xvec.set_crs + + +def test_set_crs(geom_dataset_no_crs): + with_crs = geom_dataset_no_crs.xvec.set_crs(geom=4326) + assert with_crs.xindexes["geom"].crs.equals(4326) + + +def test_set_crs_dict(geom_dataset_no_crs): + with_crs = geom_dataset_no_crs.xvec.set_crs({"geom": 4326}) + assert with_crs.xindexes["geom"].crs.equals(4326) + + +def test_set_crs_arg_err(multi_geom_dataset): + with pytest.raises(ValueError, match="Cannot specify both keyword"): + multi_geom_dataset.xvec.set_crs(geom=4326, variable_crs={"geom_z": 4326}) + + +def test_set_crs_mismatch(geom_dataset): + with pytest.raises(ValueError, match="The index 'geom' already has a CRS"): + geom_dataset.xvec.set_crs(geom=4326) + + +def test_set_crs_override(geom_dataset, geom_array): + with_crs = geom_dataset.xvec.set_crs(allow_override=True, geom=4326) + # new CRS + assert with_crs.xindexes["geom"].crs.equals(4326) + # same geometries + assert shapely.equals_exact( + geom_array, + with_crs.geom, + ).all() + + +def test_set_crs_multiple(multi_geom_dataset): + with_crs = multi_geom_dataset.xvec.to_crs(geom=4326, geom_z=4326) + assert with_crs.xindexes["geom"].crs.equals(4326) + assert with_crs.xindexes["geom_z"].crs.equals(4326) diff --git a/xvec/tests/test_index.py b/xvec/tests/test_index.py index efd9fdd..53fb8f4 100644 --- a/xvec/tests/test_index.py +++ b/xvec/tests/test_index.py @@ -7,40 +7,6 @@ from xvec import GeometryIndex -@pytest.fixture(scope="session") -def geom_array(): - return np.array([shapely.Point(1, 2), shapely.Point(3, 4)]) - - -@pytest.fixture(scope="session") -def geom_dataset_no_index(geom_array): - # a dataset with a geometry coordinate but no index - ds = xr.Dataset(coords={"geom": geom_array}) - return ds.drop_indexes("geom") - - -@pytest.fixture(scope="session") -def geom_dataset(geom_dataset_no_index): - # a dataset with a geometry coordinate baked by a GeometryIndex - crs = CRS.from_user_input(26915) - return geom_dataset_no_index.set_xindex("geom", GeometryIndex, crs=crs) - - -@pytest.fixture(scope="session") -def geom_dataset_no_crs(geom_dataset_no_index): - # a dataset with a geometry coordinate baked by a GeometryIndex (no CRS) - return geom_dataset_no_index.set_xindex("geom", GeometryIndex) - - -@pytest.fixture(scope="session") -def first_geom_dataset(geom_dataset, geom_array): - return ( - xr.Dataset(coords={"geom": [geom_array[0]]}) - .drop_indexes("geom") - .set_xindex("geom", GeometryIndex, crs=geom_dataset.xindexes["geom"].crs) - ) - - def test_set_index(geom_dataset_no_index): crs = CRS.from_user_input(26915) ds = geom_dataset_no_index.set_xindex("geom", GeometryIndex, crs=crs)