From 8142742e6024cb3ecacdbc3d175500f153a28528 Mon Sep 17 00:00:00 2001 From: Aleksandar Jelenak Date: Wed, 29 Jan 2020 12:05:23 -0500 Subject: [PATCH 1/7] Allow chunk store for Zarr datasets --- xarray/backends/zarr.py | 8 +++++++- 1 file changed, 7 insertions(+), 1 deletion(-) diff --git a/xarray/backends/zarr.py b/xarray/backends/zarr.py index 763769dac74..35f178d7041 100644 --- a/xarray/backends/zarr.py +++ b/xarray/backends/zarr.py @@ -250,10 +250,12 @@ def open_group( group=None, consolidated=False, consolidate_on_close=False, + chunk_store=None, ): import zarr - open_kwargs = dict(mode=mode, synchronizer=synchronizer, path=group) + open_kwargs = dict(mode=mode, synchronizer=synchronizer, path=group, + chunk_store=chunk_store) if consolidated: # TODO: an option to pass the metadata_key keyword zarr_group = zarr.open_consolidated(store, **open_kwargs) @@ -468,6 +470,7 @@ def open_zarr( drop_variables=None, consolidated=False, overwrite_encoded_chunks=False, + chunk_store=None, **kwargs, ): """Load and decode a dataset from a Zarr store. @@ -527,6 +530,8 @@ def open_zarr( consolidated : bool, optional Whether to open the store using zarr's consolidated metadata capability. Only works for stores that have already been consolidated. + chunk_store : MutableMapping, optional + A separate Zarr store only for chunk data. Returns ------- @@ -595,6 +600,7 @@ def maybe_decode_store(store, lock=False): synchronizer=synchronizer, group=group, consolidated=consolidated, + chunk_store=chunk_store ) ds = maybe_decode_store(zarr_store) From a20ec978b0ab16ac737918aab51280972a0221f7 Mon Sep 17 00:00:00 2001 From: Aleksandar Jelenak Date: Fri, 28 Feb 2020 13:16:26 -0500 Subject: [PATCH 2/7] Add test for open_zarr() chunk_store argument --- xarray/tests/test_backends.py | 10 ++++++++++ 1 file changed, 10 insertions(+) diff --git a/xarray/tests/test_backends.py b/xarray/tests/test_backends.py index bb77cbb94fe..5459bbc1ecb 100644 --- a/xarray/tests/test_backends.py +++ b/xarray/tests/test_backends.py @@ -1539,6 +1539,15 @@ def test_roundtrip_consolidated(self): self.check_dtypes_roundtripped(expected, actual) assert_identical(expected, actual) + def test_with_chunkstore(self): + save_kwargs = {} + expected = create_test_data() + with self.create_zarr_target() as store_target: + self.save(expected, store_target, **save_kwargs) + open_kwargs = {'chunk_store': store_target} + with self.open(store_target, **open_kwargs) as ds: + assert_equal(ds, expected) + def test_auto_chunk(self): original = create_test_data().chunk() @@ -1554,6 +1563,7 @@ def test_auto_chunk(self): # only index variables should be in memory assert v._in_memory == (k in actual.dims) # chunk size should be the same as original + assert v.chunks == original[k].chunks @pytest.mark.filterwarnings("ignore:Specified Dask chunks") From 9060925f135304ca7d0494eeedf807fd9d4ef96e Mon Sep 17 00:00:00 2001 From: Aleksandar Jelenak Date: Wed, 15 Apr 2020 09:43:19 -0400 Subject: [PATCH 3/7] Add "chunk_store" argument to to_zarr() --- xarray/backends/api.py | 4 ++++ xarray/core/dataset.py | 4 ++++ xarray/tests/test_backends.py | 9 +++++---- 3 files changed, 13 insertions(+), 4 deletions(-) diff --git a/xarray/backends/api.py b/xarray/backends/api.py index c7481e22b59..1910d26a065 100644 --- a/xarray/backends/api.py +++ b/xarray/backends/api.py @@ -1297,6 +1297,7 @@ def _validate_append_dim_and_encoding( def to_zarr( dataset, store=None, + chunk_store=None, mode=None, synchronizer=None, group=None, @@ -1312,6 +1313,8 @@ def to_zarr( """ if isinstance(store, 
Path): store = str(store) + if isinstance(chunk_store, Path): + chunk_store = str(chunk_store) if encoding is None: encoding = {} @@ -1336,6 +1339,7 @@ def to_zarr( synchronizer=synchronizer, group=group, consolidate_on_close=consolidated, + chunk_store=chunk_store ) zstore.append_dim = append_dim writer = ArrayWriter() diff --git a/xarray/core/dataset.py b/xarray/core/dataset.py index dd1e31cc61a..be099f697f5 100644 --- a/xarray/core/dataset.py +++ b/xarray/core/dataset.py @@ -1560,6 +1560,7 @@ def to_netcdf( def to_zarr( self, store: Union[MutableMapping, str, Path] = None, + chunk_store: Union[MutableMapping, str, Path] = None, mode: str = None, synchronizer=None, group: str = None, @@ -1578,6 +1579,8 @@ def to_zarr( ---------- store : MutableMapping, str or Path, optional Store or path to directory in file system. + chunk_store : MutableMapping, str or Path, optional + Store or path to directory in file system only for Zarr array chunks. mode : {'w', 'w-', 'a', None} Persistence mode: 'w' means create (overwrite if exists); 'w-' means create (fail if exists); @@ -1628,6 +1631,7 @@ def to_zarr( return to_zarr( self, store=store, + chunk_store=chunk_store, mode=mode, synchronizer=synchronizer, group=group, diff --git a/xarray/tests/test_backends.py b/xarray/tests/test_backends.py index a4c1cf782e0..138b7058548 100644 --- a/xarray/tests/test_backends.py +++ b/xarray/tests/test_backends.py @@ -1544,11 +1544,12 @@ def test_roundtrip_consolidated(self): assert_identical(expected, actual) def test_with_chunkstore(self): - save_kwargs = {} expected = create_test_data() - with self.create_zarr_target() as store_target: + with self.create_zarr_target() as store_target, \ + self.create_zarr_target() as chunk_store: + save_kwargs = {'chunk_store': chunk_store} self.save(expected, store_target, **save_kwargs) - open_kwargs = {'chunk_store': store_target} + open_kwargs = {'chunk_store': chunk_store} with self.open(store_target, **open_kwargs) as ds: assert_equal(ds, expected) @@ -1820,7 +1821,7 @@ def test_encoding_kwarg_fixed_width_string(self): # not relevant for zarr, since we don't use EncodedStringCoder pass - # TODO: someone who understand caching figure out whether chaching + # TODO: someone who understands caching figure out whether caching # makes sense for Zarr backend @pytest.mark.xfail(reason="Zarr caching not implemented") def test_dataset_caching(self):
From 752d9b73b38449fa9fb6d4bffa0169a79fa5d781 Mon Sep 17 00:00:00 2001 From: Aleksandar Jelenak Date: Fri, 3 Jul 2020 12:02:23 -0400 Subject: [PATCH 4/7] Simplify chunk_store argument handling --- xarray/backends/zarr.py | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/xarray/backends/zarr.py b/xarray/backends/zarr.py index 4cfec9ce211..33627ab54d6 100644 --- a/xarray/backends/zarr.py +++ b/xarray/backends/zarr.py @@ -280,8 +280,10 @@ def open_group( ): import zarr - open_kwargs = dict(mode=mode, synchronizer=synchronizer, path=group, - chunk_store=chunk_store) + open_kwargs = dict(mode=mode, synchronizer=synchronizer, path=group) + if chunk_store: + open_kwargs['chunk_store'] = chunk_store + if consolidated: # TODO: an option to pass the metadata_key keyword zarr_group = zarr.open_consolidated(store, **open_kwargs)
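For context, patches 1-4 simply thread `chunk_store` through to `zarr.open_group`, which since zarr-python v2.4.0 routes metadata keys to `store` and chunk-payload keys to `chunk_store` when one is given. A minimal sketch of that zarr-level behavior, assuming zarr-python >= 2.4.0 is installed; the in-memory dict stores and the array name "a" are illustrative only:

    import zarr

    meta_store = {}   # receives metadata keys such as ".zgroup" and "a/.zarray"
    chunk_store = {}  # receives only chunk-payload keys such as "a/0"

    # With a separate chunk_store, zarr writes array metadata to meta_store
    # and the compressed chunk bytes to chunk_store.
    root = zarr.open_group(meta_store, mode="w", chunk_store=chunk_store)
    arr = root.create_dataset("a", shape=(4,), chunks=(2,), dtype="i4")
    arr[:] = [1, 2, 3, 4]

    assert ".zgroup" in meta_store and "a/.zarray" in meta_store
    assert "a/0" in chunk_store and "a/1" in chunk_store

This is also presumably why patch 4 only forwards the keyword when it is set: older zarr releases do not accept `chunk_store`, so passing it unconditionally would raise a TypeError there.

From 0979f858324f697c0b5c1852e9253972174391b2 Mon Sep 17 00:00:00 2001 From: dcherian Date: Tue, 28 Jul 2020 12:33:41 -0600 Subject: [PATCH 5/7] blacken --- xarray/backends/api.py | 2 +- xarray/backends/zarr.py | 4 +- xarray/tests/test_backends.py | 7 +- xarray/tests/test_sparse.py | 889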
---------------------------------- 4 files changed, 6 insertions(+), 896 deletions(-) delete mode 100644 xarray/tests/test_sparse.py diff --git a/xarray/backends/api.py b/xarray/backends/api.py index b7a9fb50d25..d0e0ba7df8c 100644 --- a/xarray/backends/api.py +++ b/xarray/backends/api.py @@ -1349,7 +1349,7 @@ def to_zarr( synchronizer=synchronizer, group=group, consolidate_on_close=consolidated, - chunk_store=chunk_store + chunk_store=chunk_store, ) zstore.append_dim = append_dim writer = ArrayWriter() diff --git a/xarray/backends/zarr.py b/xarray/backends/zarr.py index 33627ab54d6..cd1bf641d0b 100644 --- a/xarray/backends/zarr.py +++ b/xarray/backends/zarr.py @@ -282,7 +282,7 @@ def open_group( open_kwargs = dict(mode=mode, synchronizer=synchronizer, path=group) if chunk_store: - open_kwargs['chunk_store'] = chunk_store + open_kwargs["chunk_store"] = chunk_store if consolidated: # TODO: an option to pass the metadata_key keyword @@ -651,7 +651,7 @@ def maybe_decode_store(store, lock=False): synchronizer=synchronizer, group=group, consolidated=consolidated, - chunk_store=chunk_store + chunk_store=chunk_store, ) ds = maybe_decode_store(zarr_store) diff --git a/xarray/tests/test_backends.py b/xarray/tests/test_backends.py index 37e5b1efb9a..b56191edc8f 100644 --- a/xarray/tests/test_backends.py +++ b/xarray/tests/test_backends.py @@ -1566,11 +1566,10 @@ def test_roundtrip_consolidated(self): def test_with_chunkstore(self): expected = create_test_data() - with self.create_zarr_target() as store_target, \ - self.create_zarr_target() as chunk_store: - save_kwargs = {'chunk_store': chunk_store} + with self.create_zarr_target() as store_target, self.create_zarr_target() as chunk_store: + save_kwargs = {"chunk_store": chunk_store} self.save(expected, store_target, **save_kwargs) - open_kwargs = {'chunk_store': chunk_store} + open_kwargs = {"chunk_store": chunk_store} with self.open(store_target, **open_kwargs) as ds: assert_equal(ds, expected) diff --git a/xarray/tests/test_sparse.py b/xarray/tests/test_sparse.py deleted file mode 100644 index f3c09ba6a5f..00000000000 --- a/xarray/tests/test_sparse.py +++ /dev/null @@ -1,889 +0,0 @@ -import pickle -from textwrap import dedent - -import numpy as np -import pandas as pd -import pytest - -import xarray as xr -import xarray.ufuncs as xu -from xarray import DataArray, Variable -from xarray.core.npcompat import IS_NEP18_ACTIVE -from xarray.core.pycompat import sparse_array_type - -from . 
import assert_equal, assert_identical, requires_dask - -param = pytest.param -xfail = pytest.mark.xfail - -if not IS_NEP18_ACTIVE: - pytest.skip( - "NUMPY_EXPERIMENTAL_ARRAY_FUNCTION is not enabled", allow_module_level=True - ) - -sparse = pytest.importorskip("sparse") - - -def assert_sparse_equal(a, b): - assert isinstance(a, sparse_array_type) - assert isinstance(b, sparse_array_type) - np.testing.assert_equal(a.todense(), b.todense()) - - -def make_ndarray(shape): - return np.arange(np.prod(shape)).reshape(shape) - - -def make_sparray(shape): - return sparse.random(shape, density=0.1, random_state=0) - - -def make_xrvar(dim_lengths): - return xr.Variable( - tuple(dim_lengths.keys()), make_sparray(shape=tuple(dim_lengths.values())) - ) - - -def make_xrarray(dim_lengths, coords=None, name="test"): - if coords is None: - coords = {d: np.arange(n) for d, n in dim_lengths.items()} - return xr.DataArray( - make_sparray(shape=tuple(dim_lengths.values())), - dims=tuple(coords.keys()), - coords=coords, - name=name, - ) - - -class do: - def __init__(self, meth, *args, **kwargs): - self.meth = meth - self.args = args - self.kwargs = kwargs - - def __call__(self, obj): - return getattr(obj, self.meth)(*self.args, **self.kwargs) - - def __repr__(self): - return f"obj.{self.meth}(*{self.args}, **{self.kwargs})" - - -@pytest.mark.parametrize( - "prop", - [ - "chunks", - "data", - "dims", - "dtype", - "encoding", - "imag", - "nbytes", - "ndim", - param("values", marks=xfail(reason="Coercion to dense")), - ], -) -def test_variable_property(prop): - var = make_xrvar({"x": 10, "y": 5}) - getattr(var, prop) - - -@pytest.mark.parametrize( - "func,sparse_output", - [ - (do("all"), False), - (do("any"), False), - (do("astype", dtype=int), True), - (do("clip", min=0, max=1), True), - (do("coarsen", windows={"x": 2}, func=np.sum), True), - (do("compute"), True), - (do("conj"), True), - (do("copy"), True), - (do("count"), False), - (do("get_axis_num", dim="x"), False), - (do("isel", x=slice(2, 4)), True), - (do("isnull"), True), - (do("load"), True), - (do("mean"), False), - (do("notnull"), True), - (do("roll"), True), - (do("round"), True), - (do("set_dims", dims=("x", "y", "z")), True), - (do("stack", dimensions={"flat": ("x", "y")}), True), - (do("to_base_variable"), True), - (do("transpose"), True), - (do("unstack", dimensions={"x": {"x1": 5, "x2": 2}}), True), - (do("broadcast_equals", make_xrvar({"x": 10, "y": 5})), False), - (do("equals", make_xrvar({"x": 10, "y": 5})), False), - (do("identical", make_xrvar({"x": 10, "y": 5})), False), - param( - do("argmax"), - True, - marks=xfail(reason="Missing implementation for np.argmin"), - ), - param( - do("argmin"), - True, - marks=xfail(reason="Missing implementation for np.argmax"), - ), - param( - do("argsort"), - True, - marks=xfail(reason="'COO' object has no attribute 'argsort'"), - ), - param( - do( - "concat", - variables=[ - make_xrvar({"x": 10, "y": 5}), - make_xrvar({"x": 10, "y": 5}), - ], - ), - True, - marks=xfail(reason="Coercion to dense"), - ), - param( - do("conjugate"), - True, - marks=xfail(reason="'COO' object has no attribute 'conjugate'"), - ), - param( - do("cumprod"), - True, - marks=xfail(reason="Missing implementation for np.nancumprod"), - ), - param( - do("cumsum"), - True, - marks=xfail(reason="Missing implementation for np.nancumsum"), - ), - (do("fillna", 0), True), - param( - do("item", (1, 1)), - False, - marks=xfail(reason="'COO' object has no attribute 'item'"), - ), - param( - do("median"), - False, - 
marks=xfail(reason="Missing implementation for np.nanmedian"), - ), - param(do("max"), False), - param(do("min"), False), - param( - do("no_conflicts", other=make_xrvar({"x": 10, "y": 5})), - True, - marks=xfail(reason="mixed sparse-dense operation"), - ), - param( - do("pad", mode="constant", pad_widths={"x": (1, 1)}, fill_value=5), - True, - marks=xfail(reason="Missing implementation for np.pad"), - ), - (do("prod"), False), - param( - do("quantile", q=0.5), - True, - marks=xfail(reason="Missing implementation for np.nanpercentile"), - ), - param( - do("rank", dim="x"), - False, - marks=xfail(reason="Only implemented for NumPy arrays (via bottleneck)"), - ), - param( - do("reduce", func=np.sum, dim="x"), - True, - marks=xfail(reason="Coercion to dense"), - ), - param( - do("rolling_window", dim="x", window=2, window_dim="x_win"), - True, - marks=xfail(reason="Missing implementation for np.pad"), - ), - param( - do("shift", x=2), True, marks=xfail(reason="mixed sparse-dense operation") - ), - param( - do("std"), False, marks=xfail(reason="Missing implementation for np.nanstd") - ), - (do("sum"), False), - param( - do("var"), False, marks=xfail(reason="Missing implementation for np.nanvar") - ), - param(do("to_dict"), False, marks=xfail(reason="Coercion to dense")), - (do("where", cond=make_xrvar({"x": 10, "y": 5}) > 0.5), True), - ], - ids=repr, -) -def test_variable_method(func, sparse_output): - var_s = make_xrvar({"x": 10, "y": 5}) - var_d = xr.Variable(var_s.dims, var_s.data.todense()) - ret_s = func(var_s) - ret_d = func(var_d) - - if sparse_output: - assert isinstance(ret_s.data, sparse.SparseArray) - assert np.allclose(ret_s.data.todense(), ret_d.data, equal_nan=True) - else: - assert np.allclose(ret_s, ret_d, equal_nan=True) - - -@pytest.mark.parametrize( - "func,sparse_output", - [ - (do("squeeze"), True), - param(do("to_index"), False, marks=xfail(reason="Coercion to dense")), - param(do("to_index_variable"), False, marks=xfail(reason="Coercion to dense")), - param( - do("searchsorted", 0.5), - True, - marks=xfail(reason="'COO' object has no attribute 'searchsorted'"), - ), - ], -) -def test_1d_variable_method(func, sparse_output): - var_s = make_xrvar({"x": 10}) - var_d = xr.Variable(var_s.dims, var_s.data.todense()) - ret_s = func(var_s) - ret_d = func(var_d) - - if sparse_output: - assert isinstance(ret_s.data, sparse.SparseArray) - assert np.allclose(ret_s.data.todense(), ret_d.data) - else: - assert np.allclose(ret_s, ret_d) - - -class TestSparseVariable: - @pytest.fixture(autouse=True) - def setUp(self): - self.data = sparse.random((4, 6), random_state=0, density=0.5) - self.var = xr.Variable(("x", "y"), self.data) - - def test_unary_op(self): - assert_sparse_equal(-self.var.data, -self.data) - assert_sparse_equal(abs(self.var).data, abs(self.data)) - assert_sparse_equal(self.var.round().data, self.data.round()) - - @pytest.mark.filterwarnings("ignore::PendingDeprecationWarning") - def test_univariate_ufunc(self): - assert_sparse_equal(np.sin(self.data), xu.sin(self.var).data) - - @pytest.mark.filterwarnings("ignore::PendingDeprecationWarning") - def test_bivariate_ufunc(self): - assert_sparse_equal(np.maximum(self.data, 0), xu.maximum(self.var, 0).data) - assert_sparse_equal(np.maximum(self.data, 0), xu.maximum(0, self.var).data) - - def test_repr(self): - expected = dedent( - """\ - <xarray.Variable (x: 4, y: 6)> - <COO: shape=(4, 6), dtype=float64, nnz=12, fill_value=0.0>""" - ) - assert expected == repr(self.var) - - def test_pickle(self): - v1 = self.var - v2 = pickle.loads(pickle.dumps(v1)) - assert_sparse_equal(v1.data, v2.data) - - def 
test_missing_values(self): - a = np.array([0, 1, np.nan, 3]) - s = sparse.COO.from_numpy(a) - var_s = Variable("x", s) - assert np.all(var_s.fillna(2).data.todense() == np.arange(4)) - assert np.all(var_s.count() == 3) - - -@pytest.mark.parametrize( - "prop", - [ - "attrs", - "chunks", - "coords", - "data", - "dims", - "dtype", - "encoding", - "imag", - "indexes", - "loc", - "name", - "nbytes", - "ndim", - "plot", - "real", - "shape", - "size", - "sizes", - "str", - "variable", - ], -) -def test_dataarray_property(prop): - arr = make_xrarray({"x": 10, "y": 5}) - getattr(arr, prop) - - -@pytest.mark.parametrize( - "func,sparse_output", - [ - (do("all"), False), - (do("any"), False), - (do("assign_attrs", {"foo": "bar"}), True), - (do("assign_coords", x=make_xrarray({"x": 10}).x + 1), True), - (do("astype", int), True), - (do("clip", min=0, max=1), True), - (do("compute"), True), - (do("conj"), True), - (do("copy"), True), - (do("count"), False), - (do("diff", "x"), True), - (do("drop_vars", "x"), True), - (do("expand_dims", {"z": 2}, axis=2), True), - (do("get_axis_num", "x"), False), - (do("get_index", "x"), False), - (do("identical", make_xrarray({"x": 5, "y": 5})), False), - (do("integrate", "x"), True), - (do("isel", {"x": slice(0, 3), "y": slice(2, 4)}), True), - (do("isnull"), True), - (do("load"), True), - (do("mean"), False), - (do("persist"), True), - (do("reindex", {"x": [1, 2, 3]}), True), - (do("rename", "foo"), True), - (do("reorder_levels"), True), - (do("reset_coords", drop=True), True), - (do("reset_index", "x"), True), - (do("round"), True), - (do("sel", x=[0, 1, 2]), True), - (do("shift"), True), - (do("sortby", "x", ascending=False), True), - (do("stack", z={"x", "y"}), True), - (do("transpose"), True), - # TODO - # set_index - # swap_dims - (do("broadcast_equals", make_xrvar({"x": 10, "y": 5})), False), - (do("equals", make_xrvar({"x": 10, "y": 5})), False), - param( - do("argmax"), - True, - marks=xfail(reason="Missing implementation for np.argmax"), - ), - param( - do("argmin"), - True, - marks=xfail(reason="Missing implementation for np.argmin"), - ), - param( - do("argsort"), - True, - marks=xfail(reason="'COO' object has no attribute 'argsort'"), - ), - param( - do("bfill", dim="x"), - False, - marks=xfail(reason="Missing implementation for np.flip"), - ), - (do("combine_first", make_xrarray({"x": 10, "y": 5})), True), - param( - do("conjugate"), - False, - marks=xfail(reason="'COO' object has no attribute 'conjugate'"), - ), - param( - do("cumprod"), - True, - marks=xfail(reason="Missing implementation for np.nancumprod"), - ), - param( - do("cumsum"), - True, - marks=xfail(reason="Missing implementation for np.nancumsum"), - ), - param( - do("differentiate", "x"), - False, - marks=xfail(reason="Missing implementation for np.gradient"), - ), - param( - do("dot", make_xrarray({"x": 10, "y": 5})), - True, - marks=xfail(reason="Missing implementation for np.einsum"), - ), - param(do("dropna", "x"), False, marks=xfail(reason="Coercion to dense")), - param(do("ffill", "x"), False, marks=xfail(reason="Coercion to dense")), - (do("fillna", 0), True), - param( - do("interp", coords={"x": np.arange(10) + 0.5}), - True, - marks=xfail(reason="Coercion to dense"), - ), - param( - do( - "interp_like", - make_xrarray( - {"x": 10, "y": 5}, - coords={"x": np.arange(10) + 0.5, "y": np.arange(5) + 0.5}, - ), - ), - True, - marks=xfail(reason="Indexing COO with more than one iterable index"), - ), - param(do("interpolate_na", "x"), True, marks=xfail(reason="Coercion to dense")), - 
param( - do("isin", [1, 2, 3]), - False, - marks=xfail(reason="Missing implementation for np.isin"), - ), - param( - do("item", (1, 1)), - False, - marks=xfail(reason="'COO' object has no attribute 'item'"), - ), - param(do("max"), False), - param(do("min"), False), - param( - do("median"), - False, - marks=xfail(reason="Missing implementation for np.nanmedian"), - ), - (do("notnull"), True), - (do("pipe", np.sum, axis=1), True), - (do("prod"), False), - param( - do("quantile", q=0.5), - False, - marks=xfail(reason="Missing implementation for np.nanpercentile"), - ), - param( - do("rank", "x"), - False, - marks=xfail(reason="Only implemented for NumPy arrays (via bottleneck)"), - ), - param( - do("reduce", np.sum, dim="x"), - False, - marks=xfail(reason="Coercion to dense"), - ), - param( - do( - "reindex_like", - make_xrarray( - {"x": 10, "y": 5}, - coords={"x": np.arange(10) + 0.5, "y": np.arange(5) + 0.5}, - ), - ), - True, - marks=xfail(reason="Indexing COO with more than one iterable index"), - ), - (do("roll", x=2, roll_coords=True), True), - param( - do("sel", x=[0, 1, 2], y=[2, 3]), - True, - marks=xfail(reason="Indexing COO with more than one iterable index"), - ), - param( - do("std"), False, marks=xfail(reason="Missing implementation for np.nanstd") - ), - (do("sum"), False), - param( - do("var"), False, marks=xfail(reason="Missing implementation for np.nanvar") - ), - param( - do("where", make_xrarray({"x": 10, "y": 5}) > 0.5), - False, - marks=xfail(reason="Conversion of dense to sparse when using sparse mask"), - ), - ], - ids=repr, -) -def test_dataarray_method(func, sparse_output): - arr_s = make_xrarray( - {"x": 10, "y": 5}, coords={"x": np.arange(10), "y": np.arange(5)} - ) - arr_d = xr.DataArray(arr_s.data.todense(), coords=arr_s.coords, dims=arr_s.dims) - ret_s = func(arr_s) - ret_d = func(arr_d) - - if sparse_output: - assert isinstance(ret_s.data, sparse.SparseArray) - assert np.allclose(ret_s.data.todense(), ret_d.data, equal_nan=True) - else: - assert np.allclose(ret_s, ret_d, equal_nan=True) - - -@pytest.mark.parametrize( - "func,sparse_output", - [ - (do("squeeze"), True), - param( - do("searchsorted", [1, 2, 3]), - False, - marks=xfail(reason="'COO' object has no attribute 'searchsorted'"), - ), - ], -) -def test_datarray_1d_method(func, sparse_output): - arr_s = make_xrarray({"x": 10}, coords={"x": np.arange(10)}) - arr_d = xr.DataArray(arr_s.data.todense(), coords=arr_s.coords, dims=arr_s.dims) - ret_s = func(arr_s) - ret_d = func(arr_d) - - if sparse_output: - assert isinstance(ret_s.data, sparse.SparseArray) - assert np.allclose(ret_s.data.todense(), ret_d.data, equal_nan=True) - else: - assert np.allclose(ret_s, ret_d, equal_nan=True) - - -class TestSparseDataArrayAndDataset: - @pytest.fixture(autouse=True) - def setUp(self): - self.sp_ar = sparse.random((4, 6), random_state=0, density=0.5) - self.sp_xr = xr.DataArray( - self.sp_ar, coords={"x": range(4)}, dims=("x", "y"), name="foo" - ) - self.ds_ar = self.sp_ar.todense() - self.ds_xr = xr.DataArray( - self.ds_ar, coords={"x": range(4)}, dims=("x", "y"), name="foo" - ) - - def test_to_dataset_roundtrip(self): - x = self.sp_xr - assert_equal(x, x.to_dataset("x").to_array("x")) - - def test_align(self): - a1 = xr.DataArray( - sparse.COO.from_numpy(np.arange(4)), - dims=["x"], - coords={"x": ["a", "b", "c", "d"]}, - ) - b1 = xr.DataArray( - sparse.COO.from_numpy(np.arange(4)), - dims=["x"], - coords={"x": ["a", "b", "d", "e"]}, - ) - a2, b2 = xr.align(a1, b1, join="inner") - assert isinstance(a2.data, 
sparse.SparseArray) - assert isinstance(b2.data, sparse.SparseArray) - assert np.all(a2.coords["x"].data == ["a", "b", "d"]) - assert np.all(b2.coords["x"].data == ["a", "b", "d"]) - - @pytest.mark.xfail( - reason="COO objects currently do not accept more than one " - "iterable index at a time" - ) - def test_align_2d(self): - A1 = xr.DataArray( - self.sp_ar, - dims=["x", "y"], - coords={ - "x": np.arange(self.sp_ar.shape[0]), - "y": np.arange(self.sp_ar.shape[1]), - }, - ) - - A2 = xr.DataArray( - self.sp_ar, - dims=["x", "y"], - coords={ - "x": np.arange(1, self.sp_ar.shape[0] + 1), - "y": np.arange(1, self.sp_ar.shape[1] + 1), - }, - ) - - B1, B2 = xr.align(A1, A2, join="inner") - assert np.all(B1.coords["x"] == np.arange(1, self.sp_ar.shape[0])) - assert np.all(B1.coords["y"] == np.arange(1, self.sp_ar.shape[0])) - assert np.all(B1.coords["x"] == B2.coords["x"]) - assert np.all(B1.coords["y"] == B2.coords["y"]) - - def test_align_outer(self): - a1 = xr.DataArray( - sparse.COO.from_numpy(np.arange(4)), - dims=["x"], - coords={"x": ["a", "b", "c", "d"]}, - ) - b1 = xr.DataArray( - sparse.COO.from_numpy(np.arange(4)), - dims=["x"], - coords={"x": ["a", "b", "d", "e"]}, - ) - a2, b2 = xr.align(a1, b1, join="outer") - assert isinstance(a2.data, sparse.SparseArray) - assert isinstance(b2.data, sparse.SparseArray) - assert np.all(a2.coords["x"].data == ["a", "b", "c", "d", "e"]) - assert np.all(b2.coords["x"].data == ["a", "b", "c", "d", "e"]) - - def test_concat(self): - ds1 = xr.Dataset(data_vars={"d": self.sp_xr}) - ds2 = xr.Dataset(data_vars={"d": self.sp_xr}) - ds3 = xr.Dataset(data_vars={"d": self.sp_xr}) - out = xr.concat([ds1, ds2, ds3], dim="x") - assert_sparse_equal( - out["d"].data, - sparse.concatenate([self.sp_ar, self.sp_ar, self.sp_ar], axis=0), - ) - - out = xr.concat([self.sp_xr, self.sp_xr, self.sp_xr], dim="y") - assert_sparse_equal( - out.data, sparse.concatenate([self.sp_ar, self.sp_ar, self.sp_ar], axis=1) - ) - - def test_stack(self): - arr = make_xrarray({"w": 2, "x": 3, "y": 4}) - stacked = arr.stack(z=("x", "y")) - - z = pd.MultiIndex.from_product([np.arange(3), np.arange(4)], names=["x", "y"]) - - expected = xr.DataArray( - arr.data.reshape((2, -1)), {"w": [0, 1], "z": z}, dims=["w", "z"] - ) - - assert_equal(expected, stacked) - - roundtripped = stacked.unstack() - assert arr.identical(roundtripped) - - @pytest.mark.filterwarnings("ignore::PendingDeprecationWarning") - def test_ufuncs(self): - x = self.sp_xr - assert_equal(np.sin(x), xu.sin(x)) - - def test_dataarray_repr(self): - a = xr.DataArray( - sparse.COO.from_numpy(np.ones(4)), - dims=["x"], - coords={"y": ("x", sparse.COO.from_numpy(np.arange(4, dtype="i8")))}, - ) - expected = dedent( - """\ - <xarray.DataArray (x: 4)> - <COO: shape=(4,), dtype=float64, nnz=4, fill_value=0.0> - Coordinates: - y (x) int64 <COO: nnz=3, fill_value=0> - Dimensions without coordinates: x""" - ) - assert expected == repr(a) - - def test_dataset_repr(self): - ds = xr.Dataset( - data_vars={"a": ("x", sparse.COO.from_numpy(np.ones(4)))}, - coords={"y": ("x", sparse.COO.from_numpy(np.arange(4, dtype="i8")))}, - ) - expected = dedent( - """\ - <xarray.Dataset> - Dimensions: (x: 4) - Coordinates: - y (x) int64 <COO: nnz=3, fill_value=0> - Dimensions without coordinates: x - Data variables: - a (x) float64 <COO: nnz=4, fill_value=0.0>""" - ) - assert expected == repr(ds) - - def test_sparse_dask_dataset_repr(self): - pytest.importorskip("dask", minversion="2.0") - ds = xr.Dataset( - data_vars={"a": ("x", sparse.COO.from_numpy(np.ones(4)))} - ).chunk() - expected = dedent( - """\ - <xarray.Dataset> - Dimensions: (x: 4) - Dimensions without coordinates: x - Data variables: - a (x) float64 dask.array<chunksize=(4,), meta=sparse.COO>""" - ) - assert expected == 
repr(ds) - - def test_dataarray_pickle(self): - a1 = xr.DataArray( - sparse.COO.from_numpy(np.ones(4)), - dims=["x"], - coords={"y": ("x", sparse.COO.from_numpy(np.arange(4)))}, - ) - a2 = pickle.loads(pickle.dumps(a1)) - assert_identical(a1, a2) - - def test_dataset_pickle(self): - ds1 = xr.Dataset( - data_vars={"a": ("x", sparse.COO.from_numpy(np.ones(4)))}, - coords={"y": ("x", sparse.COO.from_numpy(np.arange(4)))}, - ) - ds2 = pickle.loads(pickle.dumps(ds1)) - assert_identical(ds1, ds2) - - def test_coarsen(self): - a1 = self.ds_xr - a2 = self.sp_xr - m1 = a1.coarsen(x=2, boundary="trim").mean() - m2 = a2.coarsen(x=2, boundary="trim").mean() - - assert isinstance(m2.data, sparse.SparseArray) - assert np.allclose(m1.data, m2.data.todense()) - - @pytest.mark.xfail(reason="No implementation of np.pad") - def test_rolling(self): - a1 = self.ds_xr - a2 = self.sp_xr - m1 = a1.rolling(x=2, center=True).mean() - m2 = a2.rolling(x=2, center=True).mean() - - assert isinstance(m2.data, sparse.SparseArray) - assert np.allclose(m1.data, m2.data.todense()) - - @pytest.mark.xfail(reason="Coercion to dense") - def test_rolling_exp(self): - a1 = self.ds_xr - a2 = self.sp_xr - m1 = a1.rolling_exp(x=2, center=True).mean() - m2 = a2.rolling_exp(x=2, center=True).mean() - - assert isinstance(m2.data, sparse.SparseArray) - assert np.allclose(m1.data, m2.data.todense()) - - @pytest.mark.xfail(reason="No implementation of np.einsum") - def test_dot(self): - a1 = self.xp_xr.dot(self.xp_xr[0]) - a2 = self.sp_ar.dot(self.sp_ar[0]) - assert_equal(a1, a2) - - @pytest.mark.xfail(reason="Groupby reductions produce dense output") - def test_groupby(self): - x1 = self.ds_xr - x2 = self.sp_xr - m1 = x1.groupby("x").mean(...) - m2 = x2.groupby("x").mean(...) - assert isinstance(m2.data, sparse.SparseArray) - assert np.allclose(m1.data, m2.data.todense()) - - @pytest.mark.xfail(reason="Groupby reductions produce dense output") - def test_groupby_first(self): - x = self.sp_xr.copy() - x.coords["ab"] = ("x", ["a", "a", "b", "b"]) - x.groupby("ab").first() - x.groupby("ab").first(skipna=False) - - @pytest.mark.xfail(reason="Groupby reductions produce dense output") - def test_groupby_bins(self): - x1 = self.ds_xr - x2 = self.sp_xr - m1 = x1.groupby_bins("x", bins=[0, 3, 7, 10]).sum(...) - m2 = x2.groupby_bins("x", bins=[0, 3, 7, 10]).sum(...) 
- assert isinstance(m2.data, sparse.SparseArray) - assert np.allclose(m1.data, m2.data.todense()) - - @pytest.mark.xfail(reason="Resample produces dense output") - def test_resample(self): - t1 = xr.DataArray( - np.linspace(0, 11, num=12), - coords=[ - pd.date_range("15/12/1999", periods=12, freq=pd.DateOffset(months=1)) - ], - dims="time", - ) - t2 = t1.copy() - t2.data = sparse.COO(t2.data) - m1 = t1.resample(time="QS-DEC").mean() - m2 = t2.resample(time="QS-DEC").mean() - assert isinstance(m2.data, sparse.SparseArray) - assert np.allclose(m1.data, m2.data.todense()) - - @pytest.mark.xfail - def test_reindex(self): - x1 = self.ds_xr - x2 = self.sp_xr - for kwargs in [ - {"x": [2, 3, 4]}, - {"x": [1, 100, 2, 101, 3]}, - {"x": [2.5, 3, 3.5], "y": [2, 2.5, 3]}, - ]: - m1 = x1.reindex(**kwargs) - m2 = x2.reindex(**kwargs) - assert np.allclose(m1, m2, equal_nan=True) - - @pytest.mark.xfail - def test_merge(self): - x = self.sp_xr - y = xr.merge([x, x.rename("bar")]).to_array() - assert isinstance(y, sparse.SparseArray) - - @pytest.mark.xfail - def test_where(self): - a = np.arange(10) - cond = a > 3 - xr.DataArray(a).where(cond) - - s = sparse.COO.from_numpy(a) - cond = s > 3 - xr.DataArray(s).where(cond) - - x = xr.DataArray(s) - cond = x > 3 - x.where(cond) - - -class TestSparseCoords: - @pytest.mark.xfail(reason="Coercion of coords to dense") - def test_sparse_coords(self): - xr.DataArray( - sparse.COO.from_numpy(np.arange(4)), - dims=["x"], - coords={"x": sparse.COO.from_numpy([1, 2, 3, 4])}, - ) - - -@requires_dask -def test_chunk(): - s = sparse.COO.from_numpy(np.array([0, 0, 1, 2])) - a = DataArray(s) - ac = a.chunk(2) - assert ac.chunks == ((2, 2),) - assert isinstance(ac.data._meta, sparse.COO) - assert_identical(ac, a) - - ds = a.to_dataset(name="a") - dsc = ds.chunk(2) - assert dsc.chunks == {"dim_0": (2, 2)} - assert_identical(dsc, ds) - - -@requires_dask -def test_dask_token(): - import dask - - s = sparse.COO.from_numpy(np.array([0, 0, 1, 2])) - - # https://github.com/pydata/sparse/issues/300 - s.__dask_tokenize__ = lambda: dask.base.normalize_token(s.__dict__) - - a = DataArray(s) - t1 = dask.base.tokenize(a) - t2 = dask.base.tokenize(a) - t3 = dask.base.tokenize(a + 1) - assert t1 == t2 - assert t3 != t2 - assert isinstance(a.data, sparse.COO) - - ac = a.chunk(2) - t4 = dask.base.tokenize(ac) - t5 = dask.base.tokenize(ac + 1) - assert t4 != t5 - assert isinstance(ac.data._meta, sparse.COO) - - -@requires_dask -def test_apply_ufunc_meta_to_blockwise(): - da = xr.DataArray(np.zeros((2, 3)), dims=["x", "y"]).chunk({"x": 2, "y": 1}) - sparse_meta = sparse.COO.from_numpy(np.zeros((0, 0))) - - # if dask computed meta, it would be np.ndarray - expected = xr.apply_ufunc( - lambda x: x, da, dask="parallelized", output_dtypes=[da.dtype], meta=sparse_meta - ).data._meta - - assert_sparse_equal(expected, sparse_meta) From de8ee28ed5c52f36a91237c43f4b7987ab9d420f Mon Sep 17 00:00:00 2001 From: Aleksandar Jelenak Date: Thu, 20 Aug 2020 13:47:14 -0500 Subject: [PATCH 6/7] Add minimum zarr version requirement in docstring --- xarray/core/dataset.py | 1 + 1 file changed, 1 insertion(+) diff --git a/xarray/core/dataset.py b/xarray/core/dataset.py index 2ad856c28e5..41d563fedd6 100644 --- a/xarray/core/dataset.py +++ b/xarray/core/dataset.py @@ -1592,6 +1592,7 @@ def to_zarr( Store or path to directory in file system. chunk_store : MutableMapping, str or Path, optional Store or path to directory in file system only for Zarr array chunks. + Requires zarr-python v2.4.0 or later. 
mode : {"w", "w-", "a", None}, optional Persistence mode: "w" means create (overwrite if exists); "w-" means create (fail if exists); From 13022fc5c284a285aad29bbb5dbc5fa7d8783545 Mon Sep 17 00:00:00 2001 From: Deepak Cherian Date: Tue, 25 Aug 2020 17:37:31 +0000 Subject: [PATCH 7/7] Update xarray/tests/test_backends.py --- xarray/tests/test_backends.py | 1 - 1 file changed, 1 deletion(-) diff --git a/xarray/tests/test_backends.py b/xarray/tests/test_backends.py index 709000e3137..1173fed0055 100644 --- a/xarray/tests/test_backends.py +++ b/xarray/tests/test_backends.py @@ -1589,7 +1589,6 @@ def test_auto_chunk(self): # only index variables should be in memory assert v._in_memory == (k in actual.dims) # chunk size should be the same as original - assert v.chunks == original[k].chunks @requires_dask
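Taken together, the series lets xarray users keep Zarr metadata and chunk data in separate stores end to end. A minimal usage sketch, assuming an xarray build that includes these patches, zarr-python >= 2.4.0, and dask for the default lazy open; the in-memory dict stores are illustrative, and any MutableMapping or file-system path should work:

    import numpy as np
    import xarray as xr

    ds = xr.Dataset({"a": (("x",), np.arange(4.0))})

    meta_store = {}   # Zarr metadata documents land here
    chunk_store = {}  # all array chunk payloads land here

    # Write metadata to one store and chunks to the other; both stores
    # must be supplied again to read the data back.
    ds.to_zarr(meta_store, chunk_store=chunk_store)
    roundtripped = xr.open_zarr(meta_store, chunk_store=chunk_store)

    xr.testing.assert_identical(ds, roundtripped.load())

Splitting the stores this way mirrors the test added in patch 3 and is useful when the (small) metadata should live on fast storage while the bulk chunk data lives elsewhere.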