diff --git a/ci/requirements.txt b/ci/requirements.txt index ffa72e18..e703d88b 100644 --- a/ci/requirements.txt +++ b/ci/requirements.txt @@ -1,6 +1,7 @@ pint numpy scipy +dask[array] bottleneck xarray isort diff --git a/docs/api.rst b/docs/api.rst index a165f460..3d4269d1 100644 --- a/docs/api.rst +++ b/docs/api.rst @@ -28,6 +28,7 @@ Dataset xarray.Dataset.pint.drop_sel xarray.Dataset.pint.sel xarray.Dataset.pint.to + xarray.Dataset.pint.chunk xarray.Dataset.pint.ffill xarray.Dataset.pint.bfill @@ -57,6 +58,7 @@ DataArray xarray.DataArray.pint.drop_sel xarray.DataArray.pint.sel xarray.DataArray.pint.to + xarray.DataArray.pint.chunk xarray.DataArray.pint.ffill xarray.DataArray.pint.bfill diff --git a/docs/whats-new.rst b/docs/whats-new.rst index 12b0dc65..d4840877 100644 --- a/docs/whats-new.rst +++ b/docs/whats-new.rst @@ -29,6 +29,8 @@ What's new By `Justus Magin `_. - implement :py:meth:`Dataset.pint.drop_sel` and :py:meth:`DataArray.pint.drop_sel` (:pull:`73`). By `Justus Magin `_. +- implement :py:meth:`Dataset.pint.chunk` and :py:meth:`DataArray.pint.chunk` (:pull:`83`). + By `Justus Magin `_. - implement :py:meth:`Dataset.pint.reindex`, :py:meth:`Dataset.pint.reindex_like`, :py:meth:`DataArray.pint.reindex` and :py:meth:`DataArray.pint.reindex_like` (:pull:`69`). By `Justus Magin `_. diff --git a/pint_xarray/accessors.py b/pint_xarray/accessors.py index 952bbe34..7a7de903 100644 --- a/pint_xarray/accessors.py +++ b/pint_xarray/accessors.py @@ -569,6 +569,29 @@ def to(self, units=None, **unit_kwargs): return conversion.convert_units(self.da, units) + def chunk(self, chunks, name_prefix="xarray-", token=None, lock=False): + """unit-aware version of chunk + + Like :py:meth:`xarray.DataArray.chunk`, but chunking a quantity will change the + wrapped type to ``dask``. + + .. note:: + It is recommended to only use this when chunking in-memory arrays. To + rechunk please use :py:meth:`xarray.DataArray.chunk`. + + See Also + -------- + xarray.DataArray.chunk + xarray.Dataset.pint.chunk + """ + units = conversion.extract_units(self.da) + stripped = conversion.strip_units(self.da) + + chunked = stripped.chunk( + chunks, name_prefix=name_prefix, token=token, lock=lock + ) + return conversion.attach_units(chunked, units) + def reindex( self, indexers=None, @@ -1267,6 +1290,29 @@ def to(self, units=None, **unit_kwargs): return conversion.convert_units(self.ds, units) + def chunk(self, chunks, name_prefix="xarray-", token=None, lock=False): + """unit-aware version of chunk + + Like :py:meth:`xarray.Dataset.chunk`, but chunking a quantity will change the + wrapped type to ``dask``. + + .. note:: + It is recommended to only use this when chunking in-memory arrays. To + rechunk please use :py:meth:`xarray.Dataset.chunk`. + + See Also + -------- + xarray.Dataset.chunk + xarray.DataArray.pint.chunk + """ + units = conversion.extract_units(self.ds) + stripped = conversion.strip_units(self.ds) + + chunked = stripped.chunk( + chunks, name_prefix=name_prefix, token=token, lock=lock + ) + return conversion.attach_units(chunked, units) + def reindex( self, indexers=None, diff --git a/pint_xarray/tests/test_accessors.py b/pint_xarray/tests/test_accessors.py index 7a65aa84..a1ff5758 100644 --- a/pint_xarray/tests/test_accessors.py +++ b/pint_xarray/tests/test_accessors.py @@ -814,6 +814,72 @@ def test_drop_sel(obj, indexers, expected, error): assert_identical(actual, expected) +@pytest.mark.parametrize( + "obj", + ( + pytest.param( + xr.Dataset( + {"a": ("x", np.linspace(0, 1, 11))}, + coords={"u": ("x", np.arange(11))}, + ), + id="Dataset-no units", + ), + pytest.param( + xr.Dataset( + { + "a": ( + "x", + Quantity(np.linspace(0, 1, 11), "m"), + ) + }, + coords={ + "u": ( + "x", + Quantity(np.arange(11), "m"), + ) + }, + ), + id="Dataset-units", + ), + pytest.param( + xr.DataArray( + np.linspace(0, 1, 11), + coords={ + "u": ( + "x", + np.arange(11), + ) + }, + dims="x", + ), + id="DataArray-no units", + ), + pytest.param( + xr.DataArray( + Quantity(np.linspace(0, 1, 11), "m"), + coords={ + "u": ( + "x", + Quantity(np.arange(11), "m"), + ) + }, + dims="x", + ), + id="DataArray-units", + ), + ), +) +def test_chunk(obj): + actual = obj.pint.chunk({"x": 2}) + + expected = ( + obj.pint.dequantify().chunk({"x": 2}).pint.quantify(unit_registry=unit_registry) + ) + + assert_units_equal(actual, expected) + assert_identical(actual, expected) + + @pytest.mark.parametrize( ["obj", "indexers", "expected", "error"], ( @@ -1484,7 +1550,7 @@ def test_interp_like(obj, other, expected, error): coords={ "u": ( "x", - Quantity([nan, 0, nan, 1, nan, nan, 2, nan], "m"), + [nan, 0, nan, 1, nan, nan, 2, nan], ) }, dims="x", @@ -1494,12 +1560,12 @@ def test_interp_like(obj, other, expected, error): coords={ "u": ( "x", - Quantity([nan, 0, nan, 1, nan, nan, 2, nan], "m"), + [nan, 0, nan, 1, nan, nan, 2, nan], ) }, dims="x", ), - id="DataArray-units", + id="DataArray-no units", ), pytest.param( xr.DataArray( @@ -1578,7 +1644,7 @@ def test_ffill(obj, expected): coords={ "u": ( "x", - Quantity([nan, 0, nan, 1, nan, nan, 2, nan], "m"), + [nan, 0, nan, 1, nan, nan, 2, nan], ) }, dims="x", @@ -1588,12 +1654,12 @@ def test_ffill(obj, expected): coords={ "u": ( "x", - Quantity([nan, 0, nan, 1, nan, nan, 2, nan], "m"), + [nan, 0, nan, 1, nan, nan, 2, nan], ) }, dims="x", ), - id="DataArray-units", + id="DataArray-no units", ), pytest.param( xr.DataArray(