Use automatic chunking in from_zarr #6419

Open · wants to merge 2 commits into main
16 changes: 9 additions & 7 deletions dask/array/core.py
@@ -2841,7 +2841,7 @@ def from_array(


def from_zarr(
-    url, component=None, storage_options=None, chunks=None, name=None, **kwargs
+    url, component=None, storage_options=None, chunks="auto", name=None, **kwargs
Contributor: The docstring entry for chunks should probably be updated to reflect this default.

Member: What would you pass to retain the previous behaviour?

Member Author: You would get the chunking from the Zarr array and pass it in explicitly:

`chunks=my_zarr_array.chunks`

Or, if you wanted smaller chunks, you would specify a maximum chunk size, perhaps in bytes:

`chunks="1 MiB"`
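A minimal sketch of both options, assuming a local store at `data.zarr` (the path and array are illustrative, not part of this PR):

```python
import dask.array as da
import zarr

# Open the underlying zarr array to inspect its on-disk chunking.
z = zarr.open_array("data.zarr", mode="r")

# Retain the previous behaviour: use the on-disk chunks exactly.
x = da.from_zarr("data.zarr", chunks=z.chunks)

# Or request chunks of roughly one mebibyte each.
y = da.from_zarr("data.zarr", chunks="1 MiB")
```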

Member Author: This is also the same logic that we currently have for any other dataset that defines a chunks= attribute. I think that the default behavior is usually optimal.

Member: Sure, but it may be worthwhile indicating in the docstring how to get the inherent chunking.

Member: Can we keep chunks=None or something similar as an easy way to get the chunks on disk? It may not be easy to construct `my_zarr_array` if one only has a URL, say.

Member Author: We could. Can I ask for additional motivation, though? We don't currently do this for HDF5 or NetCDF or any other format. Why would we do this for Zarr? Why do we care about the old behavior? I expect that adding docs on this is just as likely to lead people astray as it is to help them.

As a reminder, the automatic chunking is decently smart, and we haven't ever gotten complaints about the choices that it makes, despite pretty heavy usage. It will find a chunking that aligns with the existing chunking in storage, but is mildly larger in other dimensions if necessary.
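A small sketch of that alignment behaviour, mirroring the `test_from_zarr_align_chunks` test added further down in this PR:

```python
import dask.array as da
import zarr

# Storage chunks are tall and very narrow: (1000, 4).
z = zarr.ones(shape=(40000, 40000), chunks=(1000, 4))

# With chunks="auto" (the new default), dask picks chunks that are
# exact multiples of the storage chunks, grown along the narrow axis.
x = da.from_zarr(z)
assert x.chunksize[0] % 1000 == 0
assert x.chunksize[1] % 4 == 0
```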

):
    """Load array from the zarr storage format

@@ -2859,13 +2859,15 @@ def from_zarr(
    storage_options: dict
        Any additional parameters for the storage backend (ignored for local
        paths)
-    chunks: tuple of ints or tuples of ints
-        Passed to ``da.from_array``, allows setting the chunks on
-        initialisation, if the chunking scheme in the on-disc dataset is not
-        optimal for the calculations to follow.
+    chunks: str, int, tuple
+        Passed to ``da.from_array``. See docstring there.
    name : str, optional
        An optional keyname for the array. Defaults to hashing the input
    kwargs: passed to ``zarr.Array``.
+
+    See Also
+    --------
+    from_array
    """
    import zarr

@@ -2880,10 +2882,10 @@ def from_zarr(
    else:
        mapper = url
    z = zarr.Array(mapper, read_only=True, path=component, **kwargs)
-    chunks = chunks if chunks is not None else z.chunks

    if name is None:
        name = "from-zarr-" + tokenize(z, component, storage_options, chunks, **kwargs)
-    return from_array(z, chunks, name=name)
+    return from_array(z, chunks=chunks, name=name)


def to_zarr(
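The user-visible effect is that a round trip through zarr may now come back with different, automatically chosen chunks, which is why the `a2.chunks == a.chunks` assertions are removed from the tests below. A sketch of the new default behaviour (the `example.zarr` path is illustrative):

```python
import dask.array as da

# Write an array with deliberately small chunks.
a = da.ones((4000, 4000), chunks=(125, 125))
a.to_zarr("example.zarr")

# Read it back: chunks="auto" is now the default.
a2 = da.from_zarr("example.zarr")

# a2.chunks need not equal a.chunks: small storage chunks may be merged
# into larger dask chunks that still align with what is on disk.
```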
22 changes: 16 additions & 6 deletions dask/array/tests/test_array_core.py
@@ -3857,7 +3857,22 @@ def test_zarr_roundtrip():
    a.to_zarr(d)
    a2 = da.from_zarr(d)
    assert_eq(a, a2)
-    assert a2.chunks == a.chunks
+
+
+def test_from_zarr_align_chunks():
+    zarr = pytest.importorskip("zarr")
+    a = zarr.ones(shape=(40000, 40000), chunks=(1000, 4))
+    x = da.from_zarr(a)
+    assert x.chunksize[0] % 1000 == 0
+    assert x.chunksize[1] % 4 == 0
+    assert x.chunksize[0] > x.chunksize[1]
+
+
+def test_from_zarr_auto_chunks():
+    zarr = pytest.importorskip("zarr")
+    a = zarr.array(range(100), chunks=(1,))
+    x = da.from_zarr(a)
+    assert x.npartitions < 100


@pytest.mark.parametrize("compute", [False, True])
@@ -3868,7 +3883,6 @@ def test_zarr_return_stored(compute):
    a2 = a.to_zarr(d, compute=compute, return_stored=True)
    assert isinstance(a2, Array)
    assert_eq(a, a2, check_graph=False)
-    assert a2.chunks == a.chunks


def test_to_zarr_delayed_creates_no_metadata():
@@ -3891,7 +3905,6 @@ def test_zarr_existing_array():
    a.to_zarr(z)
    a2 = da.from_zarr(z)
    assert_eq(a, a2)
-    assert a2.chunks == a.chunks


def test_to_zarr_unknown_chunks_raises():
@@ -3921,7 +3934,6 @@ def test_zarr_pass_mapper():
    a.to_zarr(mapper)
    a2 = da.from_zarr(mapper)
    assert_eq(a, a2)
-    assert a2.chunks == a.chunks


def test_zarr_group():
@@ -3942,7 +3954,6 @@ def test_zarr_group():

    a2 = da.from_zarr(d, component="test")
    assert_eq(a, a2)
-    assert a2.chunks == a.chunks


@pytest.mark.parametrize(
@@ -3972,7 +3983,6 @@ def test_zarr_nocompute():
    dask.compute(out)
    a2 = da.from_zarr(d)
    assert_eq(a, a2)
-    assert a2.chunks == a.chunks


def test_tiledb_roundtrip():
1 change: 0 additions & 1 deletion dask/tests/test_distributed.py
@@ -175,7 +175,6 @@ def test_zarr_distributed_roundtrip():
    a.to_zarr(d)
    a2 = da.from_zarr(d)
    assert_eq(a, a2)
-    assert a2.chunks == a.chunks


def test_zarr_in_memory_distributed_err(c):