Skip to content
Open
Show file tree
Hide file tree
Changes from 9 commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 3 additions & 0 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -36,6 +36,9 @@ nosetests.xml
coverage.xml
cover/*

# hypothesis
.hypothesis/

# PyBuilder
target/

Expand Down
1 change: 1 addition & 0 deletions pixi.toml
Original file line number Diff line number Diff line change
Expand Up @@ -51,6 +51,7 @@ pyarrow-all = ">=14.0.1" # includes fix to CVE 2023-47248
aiohttp = "*"
coverage = "*"
flake8 = "*"
hypothesis = "*"
ipython = "*"
ldap3 = "*"
matplotlib = "*"
Expand Down
2 changes: 2 additions & 0 deletions pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -77,6 +77,7 @@ all = [
"h5netcdf",
"h5py",
"hdf5plugin",
"hypothesis",
"jinja2",
"jmespath",
"lz4",
Expand Down Expand Up @@ -263,6 +264,7 @@ test = [
"aiohttp",
"coverage",
"flake8",
"hypothesis",
"importlib_resources;python_version < \"3.9\"",
"ipython",
"ldap3",
Expand Down
72 changes: 67 additions & 5 deletions tests/test_array.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,11 +7,13 @@
import httpx
import numpy
import pytest
from starlette.status import HTTP_400_BAD_REQUEST, HTTP_406_NOT_ACCEPTABLE
from starlette.status import HTTP_406_NOT_ACCEPTABLE, HTTP_422_UNPROCESSABLE_CONTENT

from tiled.adapters.array import ArrayAdapter
from tiled.adapters.mapping import MapAdapter
from tiled.client import Context, from_context
from tiled.client import Context, from_context, record_history
from tiled.client.array import ArrayClient
from tiled.ndslice import NDSlice
from tiled.serialization.array import as_buffer
from tiled.server.app import build_app

Expand Down Expand Up @@ -43,6 +45,10 @@
cube_cases = {
"tiny_cube": numpy.random.random((10, 10, 10)),
"tiny_hypercube": numpy.random.random((10, 10, 10, 10, 10)),
"chunked": dask.array.from_array(
numpy.arange(1_200_000, dtype="uint64").reshape((10, 300, 400)),
chunks=(1, 300, 200),
),
}
cube_tree = MapAdapter({k: ArrayAdapter.from_array(v) for k, v in cube_cases.items()})
inf_tree = MapAdapter(
Expand Down Expand Up @@ -146,12 +152,16 @@ def strict_parse_constant(c):


def test_block_validation(context):
"Verify that block must be fully specified."
"Verify that block is correctly specified."
client = from_context(context, "dask")["cube"]["tiny_cube"]
block_url = httpx.URL(client.item["links"]["block"])
# Malformed because it has only 2 dimensions, not 3.
malformed_block_url = block_url.copy_with(params={"block": "0,0"})
with fail_with_status_code(HTTP_400_BAD_REQUEST):
with fail_with_status_code(HTTP_422_UNPROCESSABLE_CONTENT):
client.context.http_client.get(malformed_block_url).raise_for_status()
# Malformed because it has 4 dimensions, not 3.
malformed_block_url = block_url.copy_with(params={"block": "0,0,0,0"})
with fail_with_status_code(HTTP_422_UNPROCESSABLE_CONTENT):
client.context.http_client.get(malformed_block_url).raise_for_status()


Expand All @@ -166,7 +176,59 @@ def test_dask(context):
def test_array_format_shape_from_cube(context):
client = from_context(context)["cube"]
with fail_with_status_code(HTTP_406_NOT_ACCEPTABLE):
hyper_cube = client["tiny_hypercube"].export("test.png") # noqa: F841
client["tiny_hypercube"].export("test.png")


@pytest.mark.parametrize(
    "bytesize_limit, num_gets_expected",
    [
        (None, 1),  # default limit: the whole array fits in a single response
        (300 * 400 * 8, 10),  # exactly one frame fits per response
        (300 * 400 * 8 - 1, 20),  # one byte short of a frame: each frame splits in half
        (300 * 400 * 16, 5),  # two frames fit per response
        (300 * 100 * 8, 40),  # each stored chunk is split in half
    ],
)
def test_request_chunking(context, bytesize_limit, num_gets_expected, monkeypatch):
    """Read a (10, 300, 400) array stored with (1, 300, 200) chunks under a
    response-size cap and verify the client issues the expected number of
    GET requests, all against the /array/full endpoint.
    """
    # Fall back to the client's default cap when the parametrized limit is None.
    effective_limit = bytesize_limit or ArrayClient.RESPONSE_BYTESIZE_LIMIT
    monkeypatch.setattr(ArrayClient, "RESPONSE_BYTESIZE_LIMIT", effective_limit)
    client = from_context(context)["cube/chunked"]
    with record_history() as history:
        fetched = client.read()
    get_requests = [req for req in history.requests if req.method == "GET"]
    assert len(get_requests) == num_gets_expected
    for req in history.requests:
        assert "/array/full" in req.url.path
    numpy.testing.assert_equal(fetched, cube_cases["chunked"])


def test_request_slicing(context):
    """A single slice that touches every chunk should be served by exactly
    one HTTP request, and the returned data must match local slicing.
    """
    client = from_context(context)["cube/chunked"]
    with record_history() as history:
        sliced = client[:, 42, 100:300]
    assert len(history.requests) == 1
    # Compare against slicing the reference array directly.
    numpy.testing.assert_equal(sliced, cube_cases["chunked"][:, 42, 100:300])


def test_request_empty_slice(context):
    """Whole-array reads must omit the `slice=` query parameter entirely."""
    client = from_context(context)["cube/chunked"]
    with record_history() as history:
        # Every spelling of "read everything" below should reach the server
        # with an expected_shape parameter but no slice parameter.
        client.read()
        client.read(slice=None)
        client.read(slice=())
        client.read(slice=Ellipsis)
        client.read(slice=NDSlice())
        client[...]
        client[()]
        client[:, :, :]
        client[:]
        client[:, ..., :]
    assert len(history.requests) == 10
    for req in history.requests:
        assert "expected_shape" in req.url.params
        assert "slice" not in req.url.params


def test_array_interface(context):
Expand Down
3 changes: 3 additions & 0 deletions tests/test_hdf5.py
Original file line number Diff line number Diff line change
Expand Up @@ -131,6 +131,8 @@ def test_from_file(example_file, buffer):
@pytest.mark.parametrize("key", ["d", "e", "f", "g", "h", "i"])
def test_from_file_with_empty_data(example_file_with_empty_data, buffer, key):
"""Serve a single HDF5 file at top level."""
if key == "h":
pytest.xfail("WIP: account for empty string datasets.")
h5py = pytest.importorskip("h5py")
tree = HDF5Adapter.from_uris(example_file_with_empty_data)
with Context.from_app(build_app(tree)) as context:
Expand Down Expand Up @@ -164,6 +166,7 @@ def test_from_file_with_scalars(example_file_with_scalars, buffer, key: str, num
@pytest.mark.filterwarnings("ignore: The dataset")
def test_from_file_with_vlen_str_dataset(example_file_with_vlen_str_in_dataset, buffer):
"""Serve a single HDF5 file at top level."""
pytest.xfail("WIP: account for vlen str datasets.")
h5py = pytest.importorskip("h5py")
tree = HDF5Adapter.from_uris(example_file_with_vlen_str_in_dataset)
with pytest.warns(UserWarning):
Expand Down
6 changes: 3 additions & 3 deletions tests/test_slicer.py
Original file line number Diff line number Diff line change
Expand Up @@ -116,7 +116,7 @@ def test_slicer(slice: str):
"""
Test the slicer function
"""
assert NDSlice.from_query(slice) == reference_slice_(slice)
assert NDSlice.from_numpy_str(slice) == reference_slice_(slice)


@pytest.mark.parametrize("slice", slice_typo_data + slice_missing_data)
Expand All @@ -125,7 +125,7 @@ def test_slicer_typo_data(slice: str):
Test the slicer function with invalid input
"""
with pytest.raises(ValueError):
_ = NDSlice.from_query(slice)
_ = NDSlice.from_numpy_str(slice)


@pytest.mark.parametrize("slice", slice_malicious_data)
Expand All @@ -134,7 +134,7 @@ def test_slicer_malicious_exec(slice: str):
Test the slicer function with 'malicious' input
"""
with pytest.raises(ValueError):
_ = NDSlice.from_query(slice)
_ = NDSlice.from_numpy_str(slice)


@pytest.mark.parametrize("slice_", slice_typo_data + slice_malicious_data)
Expand Down
1 change: 0 additions & 1 deletion tests/test_tiff.py
Original file line number Diff line number Diff line change
Expand Up @@ -71,7 +71,6 @@ def test_tiff_sequence(client, slice_input, correct_shape):
assert arr.shape == correct_shape


@pytest.mark.filterwarnings("ignore: Forcefully reshaping ")
@pytest.mark.parametrize(
"slice_input, correct_shape",
[
Expand Down
194 changes: 194 additions & 0 deletions tests/test_utils.py
Original file line number Diff line number Diff line change
@@ -1,7 +1,14 @@
import math
from pathlib import Path

import dask.array as da
import numpy as np
import pytest
from hypothesis import given, settings
from hypothesis import strategies as st

from tiled.client.utils import slices_to_dask_chunks, split_1d, split_nd_slice
from tiled.ndslice import NDSlice
from tiled.utils import (
CachingMap,
DictView,
Expand Down Expand Up @@ -365,3 +372,190 @@ def test_parse_invalid_mimetype():
with pytest.raises(ValueError):
# Parameter does not have form 'key=value'
assert parse_mimetype("text/csv;oops")


@given(data=st.data(), max_len=st.integers(1, 50))
def test_split_1d(data, max_len):
    """Property test: split_1d partitions [start, stop) into contiguous,
    grid-aligned pieces of at most max_len elements each.
    """
    # Generate start and stop values
    start = data.draw(st.integers(0, 100), label="start")
    stop = data.draw(st.integers(0, 100), label="stop")

    # Check degenerate slice
    # A zero-length slice must come back unchanged as a single interval.
    if start == stop:
        result = split_1d(start, stop, step=1, max_len=max_len, pref_splits=[])
        assert result == [(start, stop)]
        return

    # Step must match slice direction
    # (the early return above guarantees one of these branches binds `step`)
    if stop > start:
        step = data.draw(st.integers(1, 10), label="step")
    elif stop < start:
        step = data.draw(st.integers(-10, -1), label="step")

    # Preferred splits strictly inside slice and unique
    preferred_splits = data.draw(
        st.lists(
            st.integers(min(start, stop), max(start, stop) - 1),
            unique=True,
            max_size=10,
        ),
        label="preferred_splits",
    )

    result = split_1d(start, stop, step, max_len, preferred_splits)

    # 1. Check that first and last boundaries match
    assert result[0][0] == start
    assert result[-1][1] == stop

    # 2. Check contiguous intervals
    for (_, a_stop), (b_start, _) in zip(result, result[1:]):
        assert a_stop == b_start

    # 3. Check grid alignment
    # Every boundary (except possibly the final stop) must land on the
    # step grid anchored at `start`.
    for a, b in result:
        assert (a - start) % step == 0
        if b != stop:
            assert (b - start) % step == 0

    # 4. Check max length constraint
    for a, b in result:
        assert len(range(a, b, step)) <= max_len

    # 5. Check step direction consistency
    for a, b in result:
        if step > 0:
            assert b >= a
        else:
            assert b <= a

    # 6. Check no degenerate intervals
    for a, b in result:
        assert a != b
        assert len(range(a, b, step)) > 0


@st.composite
def nd_slice_strategy(draw):
    """Hypothesis strategy: generate a random (NDSlice, shape) pair.

    Each dimension is either an integer index (when its drawn length is 0)
    or a slice; slices may run backwards (negative step). The returned shape
    is always large enough to contain the slice/index in every dimension.
    """
    ndim = draw(st.integers(1, 4))

    starts = draw(st.lists(st.integers(0, 20), min_size=ndim, max_size=ndim))
    lengths = draw(st.lists(st.integers(0, 20), min_size=ndim, max_size=ndim))
    steps = draw(st.lists(st.integers(1, 5), min_size=ndim, max_size=ndim))
    # Renamed from `reversed` to avoid shadowing the builtin of that name.
    rev_flags = draw(st.lists(st.booleans(), min_size=ndim, max_size=ndim))

    slices, shape = [], []

    for start, length, step, rev in zip(starts, lengths, steps, rev_flags):
        if length == 0:
            # Singleton dimension: index with an integer; the dimension must
            # be at least start + 1 long for the index to be valid.
            slices.append(start)
            shape.append(start + 1)
        else:
            stop = start + length * step
            if rev:
                # Reversed slice: walk from stop down toward start.
                slices.append(slice(stop, start, -step))
            else:
                slices.append(slice(start, stop, step))
            shape.append(stop)

    shape = tuple(shape)

    return NDSlice(*slices).expand_for_shape(shape), shape


@st.composite
def pref_split_strategy(draw, slices):
    """Hypothesis strategy: for each dimension of *slices*, draw a sorted
    list of preferred split points lying on the slice's step grid, strictly
    inside the slice. Integer-indexed dimensions get an empty list.
    """
    preferred = []

    for dim_slice in slices:
        if isinstance(dim_slice, int):
            # Singleton (integer-indexed) dimensions cannot be split.
            preferred.append([])
            continue

        step = dim_slice.step or 1
        # Candidate split points: every grid point after the first element
        # and before the stop boundary.
        candidates = list(range(dim_slice.start + step, dim_slice.stop, step))

        if candidates:
            chosen = draw(
                st.lists(
                    st.sampled_from(candidates),
                    unique=True,
                    max_size=min(len(candidates), 5),
                )
            )
        else:
            chosen = []

        preferred.append(sorted(chosen))

    return preferred


@given(data=st.data(), max_size=st.sampled_from([1, 2, 3, 5, 50, 100, 200]))
@settings(deadline=None)
def test_split_nd_slice(data, max_size):
    """Property test: split_nd_slice breaks an N-d slice into pieces of at
    most max_size elements that reassemble exactly into the original slice.
    """
    arr_slice, shape = data.draw(nd_slice_strategy(), label="nd_slice")

    if math.prod(arr_slice.shape_after_slice(shape)) == 0:
        # Skip degenerate case where slice results in empty array
        return

    pref_splits = data.draw(pref_split_strategy(arr_slice), label="pref_splits")
    arr = np.arange(math.prod(shape)).reshape(shape)
    # `slices` maps a chunk index tuple -> the NDSlice covering that chunk.
    slices = split_nd_slice(arr_slice, max_size, pref_splits)

    # 1. Check reconstruction of the original slice from the pieces
    # Build a dask array whose task graph evaluates each piece by applying
    # its sub-slice to the reference array, then compare the assembled
    # result against direct NumPy slicing.
    darr = da.Array(
        name="test",
        dask={
            ("test",) + indx: (lambda x: arr[x], slc) for indx, slc in slices.items()
        },
        dtype=arr.dtype,
        chunks=slices_to_dask_chunks(slices, shape),
        shape=arr_slice.shape_after_slice(shape),
    )
    np.testing.assert_array_equal(darr.compute(), arr[arr_slice])

    # 2. Check that each slice respects the max_size constraint
    for slc in slices.values():
        slc_shape = slc.shape_after_slice(shape)
        assert math.prod(slc_shape) <= max_size


@pytest.mark.parametrize(
    "slice_dict,shape,expected",
    [
        # Single chunk covering the whole (10, 5) array.
        ({(0, 0): NDSlice.from_numpy_str(":10, :5")}, (10, 5), ((10,), (5,))),
        # 1-D array split into two chunks along its only axis.
        (
            {
                (0,): NDSlice.from_numpy_str(":10"),
                (1,): NDSlice.from_numpy_str("10:30"),
            },
            (30,),
            ((10, 20),),
        ),
        # 2-D array split 2x2 into four chunks.
        (
            {
                (0, 0): NDSlice.from_numpy_str(":10, :5"),
                (0, 1): NDSlice.from_numpy_str(":10, 5:12"),
                (1, 0): NDSlice.from_numpy_str("10:18, :5"),
                (1, 1): NDSlice.from_numpy_str("10:18, 5:12"),
            },
            (18, 12),
            ((10, 8), (5, 7)),
        ),
        # 3-D array split along the first and last axes only.
        (
            {
                (0, 0, 0): NDSlice.from_numpy_str(":2, :3, :4"),
                (0, 0, 1): NDSlice.from_numpy_str(":2, :3, 4:9"),
                (1, 0, 0): NDSlice.from_numpy_str("2:8, :3, :4"),
                (1, 0, 1): NDSlice.from_numpy_str("2:8, :3, 4:9"),
            },
            (8, 3, 9),
            ((2, 6), (3,), (4, 5)),
        ),
    ],
)
def test_dask_slices(slice_dict, shape, expected):
    # Verify that a chunk-index -> NDSlice mapping converts to the
    # dask-style per-axis chunk-size tuples expected by da.Array.
    assert slices_to_dask_chunks(slice_dict, shape) == expected
Loading
Loading