diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
index c388ba31de..1c25dcb1f4 100644
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -93,3 +93,22 @@ jobs:
       - name: Run Tests
         run: |
           hatch env run --env ${{ matrix.dependency-set }} run
+
+  test-complete:
+    name: Test complete
+
+    needs:
+      [
+        test,
+        test-upstream-and-min-deps,
+      ]
+    if: always()
+    runs-on: ubuntu-latest
+    steps:
+      - name: Check failure
+        if: |
+          contains(needs.*.result, 'failure') ||
+          contains(needs.*.result, 'cancelled')
+        run: exit 1
+      - name: Success
+        run: echo Success!
\ No newline at end of file
diff --git a/docs/contributing.rst b/docs/contributing.rst
index a65b3d104d..8038330239 100644
--- a/docs/contributing.rst
+++ b/docs/contributing.rst
@@ -92,12 +92,11 @@ the following::
     $ mkdir -p ~/pyenv/zarr-dev
     $ python -m venv ~/pyenv/zarr-dev
     $ source ~/pyenv/zarr-dev/bin/activate
-    $ pip install -r requirements_dev_minimal.txt -r requirements_dev_numpy.txt
-    $ pip install -e .[docs]
+    $ pip install -e .[test,docs]
 
 To verify that your development environment is working, you can run the unit tests::
 
-    $ python -m pytest -v zarr
+    $ python -m pytest -v tests
 
 Creating a branch
 ~~~~~~~~~~~~~~~~~
@@ -149,7 +148,7 @@ and invoke::
 Some tests require optional dependencies to be installed, otherwise the tests will be
 skipped. To install all optional dependencies, run::
 
-    $ pip install -r requirements_dev_optional.txt
+    $ pip install pytest-doctestplus
 
 To also run the doctests within docstrings (requires optional dependencies to be
 installed), run::
@@ -234,7 +233,7 @@
 should run and pass as doctests under Python 3.8. To run doctests, activate your
 development environment, install optional requirements, and run::
 
-    $ python -m pytest -v --doctest-plus zarr
+    $ python -m pytest -v --doctest-plus tests
 
 Zarr uses Sphinx for documentation, hosted on readthedocs.org. Documentation is
 written in the RestructuredText markup language (.rst files) in the ``docs`` folder.
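The ``--doctest-plus`` invocation above collects and runs examples embedded in docstrings. As a minimal illustration (the function below is hypothetical, not part of zarr), this is the style of docstring example that ``pytest --doctest-plus`` would discover and check::

    def scale_chunks(chunks: tuple[int, ...], factor: int) -> tuple[int, ...]:
        """Scale each chunk extent by an integer factor.

        >>> scale_chunks((2, 4), factor=3)
        (6, 12)
        """
        return tuple(factor * c for c in chunks)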
diff --git a/pyproject.toml b/pyproject.toml
index 3661fe3305..5f2d7569b9 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -341,6 +341,7 @@
 
 [[tool.mypy.overrides]]
 module = [
+    "zarr.testing.stateful",  # lots of hypothesis decorator errors
     "tests.package_with_entrypoint.*",
     "tests.test_codecs.test_codecs",
     "tests.test_codecs.test_transpose",
diff --git a/src/zarr/core/chunk_grids.py b/src/zarr/core/chunk_grids.py
index afecc6824f..ea050e39ef 100644
--- a/src/zarr/core/chunk_grids.py
+++ b/src/zarr/core/chunk_grids.py
@@ -138,6 +138,9 @@ def normalize_chunks(chunks: Any, shape: tuple[int, ...], typesize: int) -> tupl
             s if c == -1 or c is None else int(c) for s, c in zip(shape, chunks, strict=False)
         )
+    if not all(isinstance(c, numbers.Integral) for c in chunks):
+        raise TypeError("non integer value in chunks")
+
     return tuple(int(c) for c in chunks)
diff --git a/src/zarr/testing/stateful.py b/src/zarr/testing/stateful.py
new file mode 100644
index 0000000000..cc0f220807
--- /dev/null
+++ b/src/zarr/testing/stateful.py
@@ -0,0 +1,437 @@
+import builtins
+from typing import Any
+
+import hypothesis.extra.numpy as npst
+import hypothesis.strategies as st
+import numpy as np
+from hypothesis import assume, note
+from hypothesis.stateful import (
+    RuleBasedStateMachine,
+    initialize,
+    invariant,
+    precondition,
+    rule,
+)
+from hypothesis.strategies import DataObject
+
+import zarr
+from zarr import Array
+from zarr.abc.store import Store
+from zarr.core.buffer import Buffer, BufferPrototype, cpu, default_buffer_prototype
+from zarr.core.sync import SyncMixin
+from zarr.storage import LocalStore, MemoryStore
+from zarr.testing.strategies import key_ranges, node_names, np_array_and_chunks, numpy_arrays
+from zarr.testing.strategies import keys as zarr_keys
+
+MAX_BINARY_SIZE = 100
+
+
+def split_prefix_name(path: str) -> tuple[str, str]:
+    split = path.rsplit("/", maxsplit=1)
+    if len(split) > 1:
+        prefix, name = split
+    else:
+        prefix = ""
+        (name,) = split
+    return prefix, name
+
+
+class ZarrHierarchyStateMachine(SyncMixin, RuleBasedStateMachine):
+    """
+    This state machine models operations that modify a zarr store's
+    hierarchy. That is, user actions that modify arrays/groups as well
+    as list operations. It is intended to be used by external stores, and
+    compares their results to a MemoryStore that is assumed to be perfect.
+    """
+
+    def __init__(self, store: Store) -> None:
+        super().__init__()
+
+        self.store = store
+
+        self.model = MemoryStore()
+        zarr.group(store=self.model)
+
+        # Track state of the hierarchy, these should contain fully qualified paths
+        self.all_groups: set[str] = set()
+        self.all_arrays: set[str] = set()
+
+    @initialize()
+    def init_store(self) -> None:
+        # This lets us reuse the fixture provided store.
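+        # (Hypothesis constructs a fresh state machine for each generated
+        # example, but the fixture-provided store instance is shared across
+        # examples; clearing gives every example an empty store to start from.)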
+        self._sync(self.store.clear())
+        zarr.group(store=self.store)
+
+    def can_add(self, path: str) -> bool:
+        return path not in self.all_groups and path not in self.all_arrays
+
+    # -------------------- store operations -----------------------
+    @rule(name=node_names, data=st.data())
+    def add_group(self, name: str, data: DataObject) -> None:
+        if self.all_groups:
+            parent = data.draw(st.sampled_from(sorted(self.all_groups)), label="Group parent")
+        else:
+            parent = ""
+        path = f"{parent}/{name}".lstrip("/")
+        assume(self.can_add(path))
+        note(f"Adding group: path='{path}'")
+        self.all_groups.add(path)
+        zarr.group(store=self.store, path=path)
+        zarr.group(store=self.model, path=path)
+
+    @rule(
+        data=st.data(),
+        name=node_names,
+        array_and_chunks=np_array_and_chunks(arrays=numpy_arrays(zarr_formats=st.just(3))),
+    )
+    def add_array(
+        self,
+        data: DataObject,
+        name: str,
+        array_and_chunks: tuple[np.ndarray[Any, Any], tuple[int, ...]],
+    ) -> None:
+        array, chunks = array_and_chunks
+        fill_value = data.draw(npst.from_dtype(array.dtype))
+        if self.all_groups:
+            parent = data.draw(st.sampled_from(sorted(self.all_groups)), label="Array parent")
+        else:
+            parent = ""
+        # TODO: support creating deeper paths
+        # TODO: support overwriting potentially by just skipping `self.can_add`
+        path = f"{parent}/{name}".lstrip("/")
+        assume(self.can_add(path))
+        note(f"Adding array: path='{path}' shape={array.shape} chunks={chunks}")
+        for store in [self.store, self.model]:
+            zarr.array(array, chunks=chunks, path=path, store=store, fill_value=fill_value)
+        self.all_arrays.add(path)
+
+    # @precondition(lambda self: bool(self.all_groups))
+    # @precondition(lambda self: bool(self.all_arrays))
+    # @rule(data=st.data())
+    # def move_array(self, data):
+    #     array_path = data.draw(st.sampled_from(self.all_arrays), label="Array move source")
+    #     to_group = data.draw(st.sampled_from(self.all_groups), label="Array move destination")
+
+    #     # fixme renaming to self?
+    #     array_name = os.path.basename(array_path)
+    #     assume(self.model.can_add(to_group, array_name))
+    #     new_path = f"{to_group}/{array_name}".lstrip("/")
+    #     note(f"moving array '{array_path}' -> '{new_path}'")
+    #     self.model.rename(array_path, new_path)
+    #     self.repo.store.rename(array_path, new_path)
+
+    # @precondition(lambda self: len(self.all_groups) >= 2)
+    # @rule(data=st.data())
+    # def move_group(self, data):
+    #     from_group = data.draw(st.sampled_from(self.all_groups), label="Group move source")
+    #     to_group = data.draw(st.sampled_from(self.all_groups), label="Group move destination")
+    #     assume(not to_group.startswith(from_group))
+
+    #     from_group_name = os.path.basename(from_group)
+    #     assume(self.model.can_add(to_group, from_group_name))
+    #     # fixme renaming to self?
+    #     new_path = f"{to_group}/{from_group_name}".lstrip("/")
+    #     note(f"moving group '{from_group}' -> '{new_path}'")
+    #     self.model.rename(from_group, new_path)
+    #     self.repo.store.rename(from_group, new_path)
+
+    @precondition(lambda self: len(self.all_arrays) >= 1)
+    @rule(data=st.data())
+    def delete_array_using_del(self, data: DataObject) -> None:
+        array_path = data.draw(
+            st.sampled_from(sorted(self.all_arrays)), label="Array deletion target"
+        )
+        prefix, array_name = split_prefix_name(array_path)
+        note(f"Deleting array '{array_path}' ({prefix=!r}, {array_name=!r}) using del")
+        for store in [self.model, self.store]:
+            group = zarr.open_group(path=prefix, store=store)
+            group[array_name]  # check that it exists
+            del group[array_name]
+        self.all_arrays.remove(array_path)
+
+    @precondition(lambda self: len(self.all_groups) >= 2)  # fixme don't delete root
+    @rule(data=st.data())
+    def delete_group_using_del(self, data: DataObject) -> None:
+        group_path = data.draw(
+            st.sampled_from(sorted(self.all_groups)), label="Group deletion target"
+        )
+        prefix, group_name = split_prefix_name(group_path)
+        note(f"Deleting group '{group_path=!r}', {prefix=!r}, {group_name=!r} using delete")
+        members = zarr.open_group(store=self.model, path=group_path).members(max_depth=None)
+        for _, obj in members:
+            if isinstance(obj, Array):
+                self.all_arrays.remove(obj.path)
+            else:
+                self.all_groups.remove(obj.path)
+        for store in [self.store, self.model]:
+            group = zarr.open_group(store=store, path=prefix)
+            group[group_name]  # check that it exists
+            del group[group_name]
+        if group_path != "/":
+            # The root group is always present
+            self.all_groups.remove(group_path)
+
+    # # --------------- assertions -----------------
+    # def check_group_arrays(self, group):
+    #     # note(f"Checking arrays of '{group}'")
+    #     g1 = self.model.get_group(group)
+    #     g2 = zarr.open_group(path=group, mode="r", store=self.repo.store)
+    #     model_arrays = sorted(g1.arrays(), key=itemgetter(0))
+    #     our_arrays = sorted(g2.arrays(), key=itemgetter(0))
+    #     for (n1, a1), (n2, a2) in zip_longest(model_arrays, our_arrays):
+    #         assert n1 == n2
+    #         assert_array_equal(a1, a2)
+
+    # def check_subgroups(self, group_path):
+    #     g1 = self.model.get_group(group_path)
+    #     g2 = zarr.open_group(path=group_path, mode="r", store=self.repo.store)
+    #     g1_children = [name for (name, _) in g1.groups()]
+    #     g2_children = [name for (name, _) in g2.groups()]
+    #     # note(f"Checking {len(g1_children)} subgroups of group '{group_path}'")
+    #     assert g1_children == g2_children
+
+    # def check_list_prefix_from_group(self, group):
+    #     prefix = f"meta/root/{group}"
+    #     model_list = sorted(self.model.list_prefix(prefix))
+    #     al_list = sorted(self.repo.store.list_prefix(prefix))
+    #     # note(f"Checking {len(model_list)} keys under '{prefix}'")
+    #     assert model_list == al_list
+
+    #     prefix = f"data/root/{group}"
+    #     model_list = sorted(self.model.list_prefix(prefix))
+    #     al_list = sorted(self.repo.store.list_prefix(prefix))
+    #     # note(f"Checking {len(model_list)} keys under '{prefix}'")
+    #     assert model_list == al_list
+
+    # @precondition(lambda self: self.model.is_persistent_session())
+    # @rule(data=st.data())
+    # def check_group_path(self, data):
+    #     t0 = time.time()
+    #     group = data.draw(st.sampled_from(self.all_groups))
+    #     self.check_list_prefix_from_group(group)
+    #     self.check_subgroups(group)
+    #     self.check_group_arrays(group)
+    #     t1 = time.time()
+    #     note(f"Checks took {t1 - t0} sec.")
+
+    @invariant()
+    def check_list_prefix_from_root(self) -> None:
+        model_list = self._sync_iter(self.model.list_prefix(""))
+        store_list = self._sync_iter(self.store.list_prefix(""))
+        note(f"Checking {len(model_list)} keys")
+        assert sorted(model_list) == sorted(store_list)
+
+
+class SyncStoreWrapper(zarr.core.sync.SyncMixin):
+    def __init__(self, store: Store) -> None:
+        """Synchronous Store wrapper
+
+        This class holds synchronous methods that map to async methods of Store classes.
+        The synchronous wrapper is needed because hypothesis' stateful testing infra does
+        not support asyncio, so we redefine sync versions of the Store API.
+        https://github.com/HypothesisWorks/hypothesis/issues/3712#issuecomment-1668999041
+        """
+        self.store = store
+
+    @property
+    def read_only(self) -> bool:
+        return self.store.read_only
+
+    def set(self, key: str, data_buffer: Buffer) -> None:
+        return self._sync(self.store.set(key, data_buffer))
+
+    def list(self) -> builtins.list[str]:
+        return self._sync_iter(self.store.list())
+
+    def get(self, key: str, prototype: BufferPrototype) -> Buffer | None:
+        return self._sync(self.store.get(key, prototype=prototype))
+
+    def get_partial_values(
+        self, key_ranges: builtins.list[Any], prototype: BufferPrototype
+    ) -> builtins.list[Buffer | None]:
+        return self._sync(self.store.get_partial_values(prototype=prototype, key_ranges=key_ranges))
+
+    def delete(self, path: str) -> None:
+        return self._sync(self.store.delete(path))
+
+    def is_empty(self, prefix: str) -> bool:
+        return self._sync(self.store.is_empty(prefix=prefix))
+
+    def clear(self) -> None:
+        return self._sync(self.store.clear())
+
+    def exists(self, key: str) -> bool:
+        return self._sync(self.store.exists(key))
+
+    def list_dir(self, prefix: str) -> None:
+        raise NotImplementedError
+
+    def list_prefix(self, prefix: str) -> None:
+        raise NotImplementedError
+
+    def set_partial_values(self, key_start_values: Any) -> None:
+        raise NotImplementedError
+
+    @property
+    def supports_listing(self) -> bool:
+        return self.store.supports_listing
+
+    @property
+    def supports_partial_writes(self) -> bool:
+        return self.store.supports_partial_writes
+
+    @property
+    def supports_writes(self) -> bool:
+        return self.store.supports_writes
+
+
+class ZarrStoreStateMachine(RuleBasedStateMachine):
+    """
+    Zarr store state machine
+
+    This is a subclass of a Hypothesis RuleBasedStateMachine.
+    It is a testing framework that checks that the state of a Zarr store matches
+    an expected state after a set of random operations. It contains a store
+    (currently, a Zarr MemoryStore) and a model, a simplified version of a
+    zarr store (in this case, a dict). It also contains rules, which represent
+    actions that can be applied to a zarr store. Rules apply an action to both
+    the store and the model, and invariants assert that the state of the model
+    is equal to the state of the store. Hypothesis then generates sequences of
+    rules, running invariants after each rule. It raises an error if a sequence
+    produces a discrepancy between the state of the model and the state of the
+    store (i.e. an invariant is violated).
+    https://hypothesis.readthedocs.io/en/latest/stateful.html
+    """
+
+    def __init__(self, store: Store) -> None:
+        super().__init__()
+        self.model: dict[str, Buffer] = {}
+        self.store = SyncStoreWrapper(store)
+        self.prototype = default_buffer_prototype()
+
+    @initialize()
+    def init_store(self) -> None:
+        self.store.clear()
+
+    @rule(key=zarr_keys, data=st.binary(min_size=0, max_size=MAX_BINARY_SIZE))
+    def set(self, key: str, data: bytes) -> None:
+        note(f"(set) Setting {key!r} with {data}")
+        assert not self.store.read_only
+        data_buf = cpu.Buffer.from_bytes(data)
+        self.store.set(key, data_buf)
+        self.model[key] = data_buf
+
+    @precondition(lambda self: len(self.model.keys()) > 0)
+    @rule(key=zarr_keys, data=st.data())
+    def get(self, key: str, data: DataObject) -> None:
+        key = data.draw(
+            st.sampled_from(sorted(self.model.keys()))
+        )  # hypothesis wants to sample from a sorted list
+        note("(get)")
+        store_value = self.store.get(key, self.prototype)
+        # the model holds the same Buffer written in set(), so compare directly
+        assert self.model[key] == store_value
+
+    @rule(key=zarr_keys, data=st.data())
+    def get_invalid_zarr_keys(self, key: str, data: DataObject) -> None:
+        note("(get_invalid)")
+        assume(key not in self.model)
+        assert self.store.get(key, self.prototype) is None
+
+    @precondition(lambda self: len(self.model.keys()) > 0)
+    @rule(data=st.data())
+    def get_partial_values(self, data: DataObject) -> None:
+        key_range = data.draw(
+            key_ranges(keys=st.sampled_from(sorted(self.model.keys())), max_size=MAX_BINARY_SIZE)
+        )
+        note(f"(get partial) {key_range=}")
+        obs_maybe = self.store.get_partial_values(key_range, self.prototype)
+        observed = []
+
+        for obs in obs_maybe:
+            assert obs is not None
+            observed.append(obs.to_bytes())
+
+        model_vals_ls = []
+
+        for key, byte_range in key_range:
+            start = byte_range[0] or 0
+            step = byte_range[1]
+            stop = start + step if step is not None else None
+            model_vals_ls.append(self.model[key][start:stop])
+
+        assert all(
+            obs == exp.to_bytes() for obs, exp in zip(observed, model_vals_ls, strict=True)
+        ), (
+            observed,
+            model_vals_ls,
+        )
+
+    @precondition(lambda self: len(self.model.keys()) > 0)
+    @rule(data=st.data())
+    def delete(self, data: DataObject) -> None:
+        key = data.draw(st.sampled_from(sorted(self.model.keys())))
+        note(f"(delete) Deleting {key=}")
+
+        self.store.delete(key)
+        del self.model[key]
+
+    @rule()
+    def clear(self) -> None:
+        assert not self.store.read_only
+        note("(clear)")
+        self.store.clear()
+        self.model.clear()
+
+        assert self.store.is_empty("")
+
+        assert len(self.model.keys()) == len(list(self.store.list())) == 0
+
+    @rule()
+    # Local store can be non-empty when there are subdirectories but no files
+    @precondition(lambda self: not isinstance(self.store.store, LocalStore))
+    def is_empty(self) -> None:
+        note("(is_empty)")
+
+        # make sure they either both are or both aren't empty (same state)
+        assert self.store.is_empty("") == (not self.model)
+
+    @rule(key=zarr_keys)
+    def exists(self, key: str) -> None:
+        note("(exists)")
+
+        assert self.store.exists(key) == (key in self.model)
+
+    @invariant()
+    def check_paths_equal(self) -> None:
+        note("Checking that paths are equal")
+        paths = sorted(self.store.list())
+
+        assert sorted(self.model.keys()) == paths
+
+    @invariant()
+    def check_vals_equal(self) -> None:
+        note("Checking values equal")
+        for key, val in self.model.items():
+            store_item = self.store.get(key, self.prototype)
+            assert val == store_item
+
+    @invariant()
+    def check_num_zarr_keys_equal(self) -> None:
+        note("check num zarr_keys equal")
+
+        assert len(self.model) == len(list(self.store.list()))
+
+    @invariant()
+    def check_zarr_keys(self) -> None:
+        keys = list(self.store.list())
+
+        if not keys:
+            assert self.store.is_empty("") is True
+
+        else:
+            assert self.store.is_empty("") is False
+
+        for key in keys:
+            assert self.store.exists(key) is True
+        note("checking keys / exists / empty")
diff --git a/tests/test_api.py b/tests/test_api.py
index c7fc88241f..11977e8e32 100644
--- a/tests/test_api.py
+++ b/tests/test_api.py
@@ -47,6 +47,14 @@ def test_create_array(memory_store: Store) -> None:
     assert z.shape == (400,)
     assert z.chunks == (40,)
 
+    # create array with float shape
+    with pytest.raises(TypeError):
+        z = create(shape=(400.5, 100), store=store, overwrite=True)
+
+    # create array with float chunk shape
+    with pytest.raises(TypeError):
+        z = create(shape=(400, 100), chunks=(16, 16.5), store=store, overwrite=True)
+
 
 @pytest.mark.parametrize("path", ["foo", "/", "/foo", "///foo/bar"])
 @pytest.mark.parametrize("node_type", ["array", "group"])
diff --git a/tests/test_store/test_stateful.py b/tests/test_store/test_stateful.py
new file mode 100644
index 0000000000..ae10ca8d79
--- /dev/null
+++ b/tests/test_store/test_stateful.py
@@ -0,0 +1,33 @@
+# Stateful tests for arbitrary Zarr stores.
+import pytest
+from hypothesis.stateful import (
+    Settings,
+    run_state_machine_as_test,
+)
+
+from zarr.abc.store import Store
+from zarr.storage import LocalStore, MemoryStore, ZipStore
+from zarr.testing.stateful import ZarrHierarchyStateMachine, ZarrStoreStateMachine
+
+
+def test_zarr_hierarchy(sync_store: Store) -> None:
+    def mk_test_instance_sync() -> ZarrHierarchyStateMachine:
+        return ZarrHierarchyStateMachine(sync_store)
+
+    if isinstance(sync_store, ZipStore):
+        pytest.skip(reason="ZipStore does not support delete")
+    if isinstance(sync_store, MemoryStore):
+        run_state_machine_as_test(
+            mk_test_instance_sync, settings=Settings(report_multiple_bugs=False)
+        )
+
+
+def test_zarr_store(sync_store: Store) -> None:
+    def mk_test_instance_sync() -> ZarrStoreStateMachine:
+        return ZarrStoreStateMachine(sync_store)
+
+    if isinstance(sync_store, ZipStore):
+        pytest.skip(reason="ZipStore does not support delete")
+    if isinstance(sync_store, LocalStore):
+        pytest.skip(reason="This test has errors")
+    run_state_machine_as_test(mk_test_instance_sync, settings=Settings(report_multiple_bugs=True))
diff --git a/tests/test_store/test_stateful_hierarchy.py b/tests/test_store/test_stateful_hierarchy.py
deleted file mode 100644
index 844e1227da..0000000000
--- a/tests/test_store/test_stateful_hierarchy.py
+++ /dev/null
@@ -1,223 +0,0 @@
-import hypothesis.extra.numpy as npst
-import hypothesis.strategies as st
-import pytest
-from hypothesis import assume, note
-from hypothesis.stateful import (
-    RuleBasedStateMachine,
-    Settings,
-    initialize,
-    invariant,
-    precondition,
-    rule,
-    run_state_machine_as_test,
-)
-
-import zarr
-from zarr import Array
-from zarr.abc.store import Store
-from zarr.core.sync import SyncMixin
-from zarr.storage import MemoryStore, ZipStore
-from zarr.testing.strategies import node_names, np_array_and_chunks, numpy_arrays
-
-
-def split_prefix_name(path):
-    split = path.rsplit("/", maxsplit=1)
-    if len(split) > 1:
-        prefix, name = split
-    else:
-        prefix = ""
-        (name,) = split
-    return prefix, name
-
-
-class ZarrHierarchyStateMachine(SyncMixin, RuleBasedStateMachine):
-    """
-    This state machine models operations that modify a zarr store's
-    hierarchy. That is, user actions that modify arrays/groups as well
-    as list operations. It is intended to be used by external stores, and
-    compares their results to a MemoryStore that is assumed to be perfect.
-    """
-
-    def __init__(self, store) -> None:
-        super().__init__()
-
-        self.store = store
-
-        self.model = MemoryStore()
-        zarr.group(store=self.model)
-
-        # Track state of the hierarchy, these should contain fully qualified paths
-        self.all_groups = set()
-        self.all_arrays = set()
-
-    @initialize()
-    def init_store(self):
-        # This lets us reuse the fixture provided store.
-        self._sync(self.store.clear())
-        zarr.group(store=self.store)
-
-    def can_add(self, path):
-        return path not in self.all_groups and path not in self.all_arrays
-
-    # -------------------- store operations -----------------------
-    @rule(name=node_names, data=st.data())
-    def add_group(self, name, data):
-        if self.all_groups:
-            parent = data.draw(st.sampled_from(sorted(self.all_groups)), label="Group parent")
-        else:
-            parent = ""
-        path = f"{parent}/{name}".lstrip("/")
-        assume(self.can_add(path))
-        note(f"Adding group: path='{path}'")
-        self.all_groups.add(path)
-        zarr.group(store=self.store, path=path)
-        zarr.group(store=self.model, path=path)
-
-    @rule(
-        data=st.data(),
-        name=node_names,
-        array_and_chunks=np_array_and_chunks(arrays=numpy_arrays(zarr_formats=st.just(3))),
-    )
-    def add_array(self, data, name, array_and_chunks):
-        array, chunks = array_and_chunks
-        fill_value = data.draw(npst.from_dtype(array.dtype))
-        if self.all_groups:
-            parent = data.draw(st.sampled_from(sorted(self.all_groups)), label="Array parent")
-        else:
-            parent = ""
-        # TODO: support creating deeper paths
-        # TODO: support overwriting potentially by just skipping `self.can_add`
-        path = f"{parent}/{name}".lstrip("/")
-        assume(self.can_add(path))
-        note(f"Adding array: path='{path}' shape={array.shape} chunks={chunks}")
-        for store in [self.store, self.model]:
-            zarr.array(array, chunks=chunks, path=path, store=store, fill_value=fill_value)
-        self.all_arrays.add(path)
-
-    # @precondition(lambda self: bool(self.all_groups))
-    # @precondition(lambda self: bool(self.all_arrays))
-    # @rule(data=st.data())
-    # def move_array(self, data):
-    #     array_path = data.draw(st.sampled_from(self.all_arrays), label="Array move source")
-    #     to_group = data.draw(st.sampled_from(self.all_groups), label="Array move destination")
-
-    #     # fixme renaiming to self?
-    #     array_name = os.path.basename(array_path)
-    #     assume(self.model.can_add(to_group, array_name))
-    #     new_path = f"{to_group}/{array_name}".lstrip("/")
-    #     note(f"moving array '{array_path}' -> '{new_path}'")
-    #     self.model.rename(array_path, new_path)
-    #     self.repo.store.rename(array_path, new_path)
-
-    # @precondition(lambda self: len(self.all_groups) >= 2)
-    # @rule(data=st.data())
-    # def move_group(self, data):
-    #     from_group = data.draw(st.sampled_from(self.all_groups), label="Group move source")
-    #     to_group = data.draw(st.sampled_from(self.all_groups), label="Group move destination")
-    #     assume(not to_group.startswith(from_group))

-    #     from_group_name = os.path.basename(from_group)
-    #     assume(self.model.can_add(to_group, from_group_name))
-    #     # fixme renaiming to self?
-    #     new_path = f"{to_group}/{from_group_name}".lstrip("/")
-    #     note(f"moving group '{from_group}' -> '{new_path}'")
-    #     self.model.rename(from_group, new_path)
-    #     self.repo.store.rename(from_group, new_path)
-
-    @precondition(lambda self: len(self.all_arrays) >= 1)
-    @rule(data=st.data())
-    def delete_array_using_del(self, data):
-        array_path = data.draw(
-            st.sampled_from(sorted(self.all_arrays)), label="Array deletion target"
-        )
-        prefix, array_name = split_prefix_name(array_path)
-        note(f"Deleting array '{array_path}' ({prefix=!r}, {array_name=!r}) using del")
-        for store in [self.model, self.store]:
-            group = zarr.open_group(path=prefix, store=store)
-            group[array_name]  # check that it exists
-            del group[array_name]
-        self.all_arrays.remove(array_path)
-
-    @precondition(lambda self: len(self.all_groups) >= 2)  # fixme don't delete root
-    @rule(data=st.data())
-    def delete_group_using_del(self, data):
-        group_path = data.draw(
-            st.sampled_from(sorted(self.all_groups)), label="Group deletion target"
-        )
-        prefix, group_name = split_prefix_name(group_path)
-        note(f"Deleting group '{group_path=!r}', {prefix=!r}, {group_name=!r} using delete")
-        members = zarr.open_group(store=self.model, path=group_path).members(max_depth=None)
-        for _, obj in members:
-            if isinstance(obj, Array):
-                self.all_arrays.remove(obj.path)
-            else:
-                self.all_groups.remove(obj.path)
-        for store in [self.store, self.model]:
-            group = zarr.open_group(store=store, path=prefix)
-            group[group_name]  # check that it exists
-            del group[group_name]
-        if group_path != "/":
-            # The root group is always present
-            self.all_groups.remove(group_path)
-
-    # # --------------- assertions -----------------
-    # def check_group_arrays(self, group):
-    #     # note(f"Checking arrays of '{group}'")
-    #     g1 = self.model.get_group(group)
-    #     g2 = zarr.open_group(path=group, mode="r", store=self.repo.store)
-    #     model_arrays = sorted(g1.arrays(), key=itemgetter(0))
-    #     our_arrays = sorted(g2.arrays(), key=itemgetter(0))
-    #     for (n1, a1), (n2, a2) in zip_longest(model_arrays, our_arrays):
-    #         assert n1 == n2
-    #         assert_array_equal(a1, a2)
-
-    # def check_subgroups(self, group_path):
-    #     g1 = self.model.get_group(group_path)
-    #     g2 = zarr.open_group(path=group_path, mode="r", store=self.repo.store)
-    #     g1_children = [name for (name, _) in g1.groups()]
-    #     g2_children = [name for (name, _) in g2.groups()]
-    #     # note(f"Checking {len(g1_children)} subgroups of group '{group_path}'")
-    #     assert g1_children == g2_children
-
-    # def check_list_prefix_from_group(self, group):
-    #     prefix = f"meta/root/{group}"
-    #     model_list = sorted(self.model.list_prefix(prefix))
-    #     al_list = sorted(self.repo.store.list_prefix(prefix))
-    #     # note(f"Checking {len(model_list)} keys under '{prefix}'")
-    #     assert model_list == al_list
-
-    #     prefix = f"data/root/{group}"
-    #     model_list = sorted(self.model.list_prefix(prefix))
-    #     al_list = sorted(self.repo.store.list_prefix(prefix))
-    #     # note(f"Checking {len(model_list)} keys under '{prefix}'")
-    #     assert model_list == al_list
-
-    # @precondition(lambda self: self.model.is_persistent_session())
-    # @rule(data=st.data())
-    # def check_group_path(self, data):
-    #     t0 = time.time()
-    #     group = data.draw(st.sampled_from(self.all_groups))
-    #     self.check_list_prefix_from_group(group)
-    #     self.check_subgroups(group)
-    #     self.check_group_arrays(group)
-    #     t1 = time.time()
-    #     note(f"Checks took {t1 - t0} sec.")
-
-    @invariant()
-    def check_list_prefix_from_root(self):
-        model_list = self._sync_iter(self.model.list_prefix(""))
-        store_list = self._sync_iter(self.store.list_prefix(""))
-        note(f"Checking {len(model_list)} keys")
-        assert sorted(model_list) == sorted(store_list)
-
-
-def test_zarr_hierarchy(sync_store: Store):
-    def mk_test_instance_sync() -> ZarrHierarchyStateMachine:
-        return ZarrHierarchyStateMachine(sync_store)
-
-    if isinstance(sync_store, ZipStore):
-        pytest.skip(reason="ZipStore does not support delete")
-    if isinstance(sync_store, MemoryStore):
-        run_state_machine_as_test(
-            mk_test_instance_sync, settings=Settings(report_multiple_bugs=False)
-        )
diff --git a/tests/test_store/test_stateful_store.py b/tests/test_store/test_stateful_store.py
deleted file mode 100644
index 751c1ac746..0000000000
--- a/tests/test_store/test_stateful_store.py
+++ /dev/null
@@ -1,249 +0,0 @@
-# Stateful tests for arbitrary Zarr stores.
-import hypothesis.strategies as st
-import pytest
-from hypothesis import assume, note
-from hypothesis.stateful import (
-    RuleBasedStateMachine,
-    Settings,
-    initialize,
-    invariant,
-    precondition,
-    rule,
-    run_state_machine_as_test,
-)
-from hypothesis.strategies import DataObject
-
-import zarr
-from zarr.abc.store import Store
-from zarr.core.buffer import BufferPrototype, cpu, default_buffer_prototype
-from zarr.storage import LocalStore, ZipStore
-from zarr.testing.strategies import key_ranges
-from zarr.testing.strategies import keys as zarr_keys
-
-MAX_BINARY_SIZE = 100
-
-
-class SyncStoreWrapper(zarr.core.sync.SyncMixin):
-    def __init__(self, store: Store) -> None:
-        """Synchronous Store wrapper
-
-        This class holds synchronous methods that map to async methods of Store classes.
-        The synchronous wrapper is needed because hypothesis' stateful testing infra does
-        not support asyncio so we redefine sync versions of the Store API.
-        https://github.com/HypothesisWorks/hypothesis/issues/3712#issuecomment-1668999041
-        """
-        self.store = store
-
-    @property
-    def read_only(self) -> bool:
-        return self.store.read_only
-
-    def set(self, key: str, data_buffer: zarr.core.buffer.Buffer) -> None:
-        return self._sync(self.store.set(key, data_buffer))
-
-    def list(self) -> list:
-        return self._sync_iter(self.store.list())
-
-    def get(self, key: str, prototype: BufferPrototype) -> zarr.core.buffer.Buffer:
-        return self._sync(self.store.get(key, prototype=prototype))
-
-    def get_partial_values(
-        self, key_ranges: list, prototype: BufferPrototype
-    ) -> zarr.core.buffer.Buffer:
-        return self._sync(self.store.get_partial_values(prototype=prototype, key_ranges=key_ranges))
-
-    def delete(self, path: str) -> None:
-        return self._sync(self.store.delete(path))
-
-    def is_empty(self, prefix: str) -> bool:
-        return self._sync(self.store.is_empty(prefix=prefix))
-
-    def clear(self) -> None:
-        return self._sync(self.store.clear())
-
-    def exists(self, key) -> bool:
-        return self._sync(self.store.exists(key))
-
-    def list_dir(self, prefix):
-        raise NotImplementedError
-
-    def list_prefix(self, prefix: str):
-        raise NotImplementedError
-
-    def set_partial_values(self, key_start_values):
-        raise NotImplementedError
-
-    @property
-    def supports_listing(self) -> bool:
-        return self.store.supports_listing
-
-    @property
-    def supports_partial_writes(self) -> bool:
-        return self.supports_partial_writes
-
-    @property
-    def supports_writes(self) -> bool:
-        return self.store.supports_writes
-
-
-class ZarrStoreStateMachine(RuleBasedStateMachine):
-    """ "
-    Zarr store state machine
-
-    This is a subclass of a Hypothesis RuleBasedStateMachine.
-    It is testing a framework to ensure that the state of a Zarr store matches
-    an expected state after a set of random operations. It contains a store
-    (currently, a Zarr MemoryStore) and a model, a simplified version of a
-    zarr store (in this case, a dict). It also contains rules which represent
-    actions that can be applied to a zarr store. Rules apply an action to both
-    the store and the model, and invariants assert that the state of the model
-    is equal to the state of the store. Hypothesis then generates sequences of
-    rules, running invariants after each rule. It raises an error if a sequence
-    produces discontinuity between state of the model and state of the store
-    (ie. an invariant is violated).
-    https://hypothesis.readthedocs.io/en/latest/stateful.html
-    """
-
-    def __init__(self, store: Store) -> None:
-        super().__init__()
-        self.model: dict[str, bytes] = {}
-        self.store = SyncStoreWrapper(store)
-        self.prototype = default_buffer_prototype()
-
-    @initialize()
-    def init_store(self):
-        self.store.clear()
-
-    @rule(key=zarr_keys, data=st.binary(min_size=0, max_size=MAX_BINARY_SIZE))
-    def set(self, key: str, data: DataObject) -> None:
-        note(f"(set) Setting {key!r} with {data}")
-        assert not self.store.read_only
-        data_buf = cpu.Buffer.from_bytes(data)
-        self.store.set(key, data_buf)
-        self.model[key] = data_buf
-
-    @precondition(lambda self: len(self.model.keys()) > 0)
-    @rule(key=zarr_keys, data=st.data())
-    def get(self, key: str, data: DataObject) -> None:
-        key = data.draw(
-            st.sampled_from(sorted(self.model.keys()))
-        )  # hypothesis wants to sample from sorted list
-        note("(get)")
-        store_value = self.store.get(key, self.prototype)
-        # to bytes here necessary because data_buf set to model in set()
-        assert self.model[key].to_bytes() == (store_value.to_bytes())
-
-    @rule(key=zarr_keys, data=st.data())
-    def get_invalid_zarr_keys(self, key: str, data: DataObject) -> None:
-        note("(get_invalid)")
-        assume(key not in self.model)
-        assert self.store.get(key, self.prototype) is None
-
-    @precondition(lambda self: len(self.model.keys()) > 0)
-    @rule(data=st.data())
-    def get_partial_values(self, data: DataObject) -> None:
-        key_range = data.draw(
-            key_ranges(keys=st.sampled_from(sorted(self.model.keys())), max_size=MAX_BINARY_SIZE)
-        )
-        note(f"(get partial) {key_range=}")
-        obs_maybe = self.store.get_partial_values(key_range, self.prototype)
-        observed = []
-
-        for obs in obs_maybe:
-            assert obs is not None
-            observed.append(obs.to_bytes())
-
-        model_vals_ls = []
-
-        for key, byte_range in key_range:
-            start = byte_range[0] or 0
-            step = byte_range[1]
-            stop = start + step if step is not None else None
-            model_vals_ls.append(self.model[key][start:stop])
-
-        assert all(
-            obs == exp.to_bytes() for obs, exp in zip(observed, model_vals_ls, strict=True)
-        ), (
-            observed,
-            model_vals_ls,
-        )
-
-    @precondition(lambda self: len(self.model.keys()) > 0)
-    @rule(data=st.data())
-    def delete(self, data: DataObject) -> None:
-        key = data.draw(st.sampled_from(sorted(self.model.keys())))
-        note(f"(delete) Deleting {key=}")
-
-        self.store.delete(key)
-        del self.model[key]
-
-    @rule()
-    def clear(self) -> None:
-        assert not self.store.read_only
-        note("(clear)")
-        self.store.clear()
-        self.model.clear()
-
-        assert self.store.is_empty("")
-
-        assert len(self.model.keys()) == len(list(self.store.list())) == 0
-
-    @rule()
-    # Local store can be non-empty when there are subdirectories but no files
-    @precondition(lambda self: not isinstance(self.store.store, LocalStore))
-    def is_empty(self) -> None:
-        note("(is_empty)")
-
-        # make sure they either both are or both aren't empty (same state)
-        assert self.store.is_empty("") == (not self.model)
-
-    @rule(key=zarr_keys)
-    def exists(self, key: str) -> None:
-        note("(exists)")
-
-        assert self.store.exists(key) == (key in self.model)
-
-    @invariant()
-    def check_paths_equal(self) -> None:
-        note("Checking that paths are equal")
-        paths = sorted(self.store.list())
-
-        assert sorted(self.model.keys()) == paths
-
-    @invariant()
-    def check_vals_equal(self) -> None:
-        note("Checking values equal")
-        for key, val in self.model.items():
-            store_item = self.store.get(key, self.prototype).to_bytes()
-            assert val.to_bytes() == store_item
-
-    @invariant()
-    def check_num_zarr_keys_equal(self) -> None:
-        note("check num zarr_keys equal")
-
-        assert len(self.model) == len(list(self.store.list()))
-
-    @invariant()
-    def check_zarr_keys(self) -> None:
-        keys = list(self.store.list())
-
-        if not keys:
-            assert self.store.is_empty("") is True
-
-        else:
-            assert self.store.is_empty("") is False
-
-        for key in keys:
-            assert self.store.exists(key) is True
-        note("checking keys / exists / empty")
-
-
-def test_zarr_hierarchy(sync_store: Store) -> None:
-    def mk_test_instance_sync() -> None:
-        return ZarrStoreStateMachine(sync_store)
-
-    if isinstance(sync_store, ZipStore):
-        pytest.skip(reason="ZipStore does not support delete")
-    if isinstance(sync_store, LocalStore):
-        pytest.skip(reason="This test has errors")
-    run_state_machine_as_test(mk_test_instance_sync, settings=Settings(report_multiple_bugs=True))
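Since the state machines now ship in ``zarr.testing.stateful``, store implementations outside this repository can reuse them. A minimal sketch of such a test (the test name is hypothetical, and ``MemoryStore`` stands in for the external ``Store`` subclass under test)::

    from hypothesis.stateful import Settings, run_state_machine_as_test

    from zarr.storage import MemoryStore
    from zarr.testing.stateful import ZarrHierarchyStateMachine

    def test_my_store_hierarchy() -> None:
        # ZarrHierarchyStateMachine applies random hierarchy operations to the
        # store under test and compares it against an in-memory model store.
        store = MemoryStore()  # swap in the store implementation being tested
        run_state_machine_as_test(
            lambda: ZarrHierarchyStateMachine(store),
            settings=Settings(report_multiple_bugs=False),
        )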