From b25ca24737ad7b1e4e6f042a1a84c2f03627f6a6 Mon Sep 17 00:00:00 2001
From: ntfrgl <b.beronov@gmail.com>
Date: Thu, 30 Apr 2026 10:59:54 -0700
Subject: [PATCH 1/4] Introduce `ecoli.library.xarray_emitter`

---
 .gitignore                                    |   2 +-
 configs/test_configs/test_xarray_emitter.json | 117 +++
 doc/apidoc_templates/module.rst_t             |   2 -
 doc/composites.rst                            |   9 +-
 doc/conf.py                                   |  44 +-
 doc/experiments.rst                           |   3 +
 doc/stores.rst                                |   2 +
 doc/workflows.rst                             |   5 +
 ecoli/__init__.py                             |   2 +
 ecoli/experiments/ecoli_master_sim.py         | 196 +++--
 ecoli/library/emitter.py                      | 168 ++++
 ecoli/library/parquet_emitter.py              | 102 ++-
 ecoli/library/test_parquet_emitter.py         | 284 +++----
 ecoli/library/test_utils.py                   |  99 +++
 ecoli/library/xarray_emitter/__init__.py      | 288 +++++++
 ecoli/library/xarray_emitter/emit_path.py     | 136 +++
 .../library/xarray_emitter/emit_predicate.py  | 225 +++++
 ecoli/library/xarray_emitter/emitter.py       | 233 +++++
 ecoli/library/xarray_emitter/storage.py       | 369 ++++++++
 .../xarray_emitter/test_xarray_emitter.py     | 300 +++++++
 ecoli/library/xarray_emitter/transducer.py    | 601 +++++++++++++
 ecoli/library/xarray_emitter/utils.py         |  65 ++
 ecoli/library/xarray_emitter/view.py          | 386 +++++++++
 ecoli/library/xarray_emitter/writer.py        | 523 ++++++++++++
 ecoli/library/xarray_emitter/zarr_writer.py   | 801 ++++++++++++++++++
 ecoli/processes/engine_process.py             |  27 +-
 ecoli/processes/listeners/mass_listener.py    |   4 +-
 pyproject.toml                                |   8 +
 pytest.ini                                    |   6 +
 runscripts/test_workflow.py                   | 304 ++++++-
 uv.lock                                       |  80 +-
 31 files changed, 5086 insertions(+), 305 deletions(-)
 create mode 100644 configs/test_configs/test_xarray_emitter.json
 create mode 100644 ecoli/library/emitter.py
 create mode 100644 ecoli/library/test_utils.py
 create mode 100644 ecoli/library/xarray_emitter/__init__.py
 create mode 100644 ecoli/library/xarray_emitter/emit_path.py
 create mode 100644 ecoli/library/xarray_emitter/emit_predicate.py
 create mode 100644 ecoli/library/xarray_emitter/emitter.py
 create mode 100644 ecoli/library/xarray_emitter/storage.py
 create mode 100644 ecoli/library/xarray_emitter/test_xarray_emitter.py
 create mode 100644 ecoli/library/xarray_emitter/transducer.py
 create mode 100644 ecoli/library/xarray_emitter/utils.py
 create mode 100644 ecoli/library/xarray_emitter/view.py
 create mode 100644 ecoli/library/xarray_emitter/writer.py
 create mode 100644 ecoli/library/xarray_emitter/zarr_writer.py

diff --git a/.gitignore b/.gitignore
index cf55a3998..514d3deff 100644
--- a/.gitignore
+++ b/.gitignore
@@ -69,4 +69,4 @@ trace-*
 test_sherlock/
 
 # SMS API #
-.hpc_env
\ No newline at end of file
+.hpc_env
diff --git a/configs/test_configs/test_xarray_emitter.json b/configs/test_configs/test_xarray_emitter.json
new file mode 100644
index 000000000..0c4532c71
--- /dev/null
+++ b/configs/test_configs/test_xarray_emitter.json
@@ -0,0 +1,117 @@
+{
+  "experiment_id": "test_xarray_emitter",
+  "fixed_media": "minimal",
+  "suffix_time": false,
+  "max_duration": 10.0,
+  "fail_at_max_duration": false,
+  "generations": 1,
+  "n_init_sims": 1,
+  "log_updates": true,
+  "emitter": "xarray",
+  "emitter_arg": {
+    "debug": false,
+    "transducer": {
+      "predicate": [
+        [
+          {"subsample": {"interval": 1}},
+          {"fixed": {"steps": [0]}}
+        ]
+      ],
+      "buffer": {
+        "size": 3
+      }
+    },
+    "writer": {
+      "store": "out/store",
+      "threaded": true,
+      "buffers_per_chunk": 2,
+      "backend": "zarr",
+      "backend_config": {
+        "format": 3,
+        "async.concurrency": 3,
+        "threading.max_workers": 3
+      }
+    },
+    "view": [
+      {
+        "root": [],
+        "variables": {
+          "bulk": [{
+            "path": "bulk/bulk_molecule",
+            "dtype": "<i8",
+            "codecs": {
+              "filters_v2": [],
+              "filters_v3": [],
+              "compressors_v2": [{
+                "id": "lzma", "format": 3, "check": -1, "preset": null,
+                "filters": [{"id": 3, "dist": 8}, {"id": 33, "preset": 5}]
+              }],
+              "compressors_v3": [{
+                "name": "numcodecs.lzma",
+                "configuration": {
+                  "format": 3,
+                  "filters": [{"id": 3, "dist": 8}, {"id": 33, "preset": 5}]
+                }
+              }]
+            }
+          }]
+        }
+      },
+      {
+        "root": ["listeners", "mass"],
+        "metadata": false,
+        "variables": {
+          "cell_mass": [{
+            "path": "gauges/cell_mass",
+            "unit": "[fg]",
+            "dtype": "<f4"
+          }],
+          "dry_mass": [{
+            "path": "gauges/dry_mass",
+            "unit": "[fg]",
+            "dtype": "<f4"
+          }]
+        }
+      },
+      {
+        "root": ["log_update", "ecoli-metabolism", "listeners"],
+        "variables": {
+          "fba_results": {
+            "coefficient": [{
+              "path": "gauges/mass_per_vol",
+              "unit": "[g/L]",
+              "dtype": "<f4"
+            }],
+            "reaction_fluxes": [{
+              "path": "metabolism/fluxes/internal/rxn",
+              "unit": "[mmol/L.s]",
+              "dtype": "<f4"
+            }],
+            "external_exchange_fluxes": [{
+              "path": "metabolism/fluxes/exchange/molecule",
+              "unit": "[mmol/g.h]",
+              "dtype": "<f4"
+            }]
+          },
+          "enzyme_kinetics": {
+            "counts_to_molar": [{
+              "path": "gauges/conc_per_count",
+              "unit": "[mmol/L]",
+              "dtype": "<f4"
+            }],
+            "actual_fluxes": [{
+              "path": "metabolism/fluxes/internal/rxn_constrained",
+              "unit": "[mmol/L.s]",
+              "dtype": "<f4"
+            }],
+            "target_fluxes": [{
+              "path": "metabolism/fluxes/internal/rxn_target",
+              "unit": "[mmol/L.s]",
+              "dtype": "<f4"
+            }]
+          }
+        }
+      }
+    ]
+  }
+}
diff --git a/doc/apidoc_templates/module.rst_t b/doc/apidoc_templates/module.rst_t
index f4aee8c67..f2a49a57e 100644
--- a/doc/apidoc_templates/module.rst_t
+++ b/doc/apidoc_templates/module.rst_t
@@ -1,7 +1,5 @@
 {{- "``{}``".format(basename) | heading }}
 .. automodule:: {{ qualname }}
-   :private-members:
-   :exclude-members: _abc_impl 
 {%- for option in automodule_options %}
    :{{ option }}:
 {%- endfor %}
diff --git a/doc/composites.rst b/doc/composites.rst
index 73083f264..35cd0cce1 100644
--- a/doc/composites.rst
+++ b/doc/composites.rst
@@ -72,6 +72,9 @@ their corresponding topologies to the final composite model.
 - ``generations``: Adds :py:class:`~ecoli.processes.cell_division.StopAfterDivision`
   when ``True`` but only if ``divide`` is ``True``
 
+
+.. _log_updates:
+
 -----------
 Log Updates
 -----------
@@ -90,8 +93,10 @@ The analysis plots located in :py:mod:`~ecoli.analysis.single.blame` can be used
 to visualize these updates.
 
 .. warning::
-    This feature should only be turned for debugging purposes and
-    only when using the in-memory emitter (see :ref:`ram_emitter`).
+    This feature should only be turned on for debugging purposes, and only when
+    using the :ref:`in-memory emitter <ram_emitter>` or the
+    :py:mod:`.xarray_emitter`.
+
 
 -------------
 Initial State
diff --git a/doc/conf.py b/doc/conf.py
index 9abcc5c31..06ffe1a0e 100644
--- a/doc/conf.py
+++ b/doc/conf.py
@@ -86,6 +86,20 @@
     # Silence warning in ecoli.processes.environment.field_timeline.FieldTimeline
     ("py:class", "vivarium.processes.timeline.TimelineProcess"),
     ("py:class", "concurrent.futures._base.Future"),
+    # Type annotations using library internals
+    ("py:class", "concurrent.futures._base.Executor"),
+    ("py:class", "unittest.mock._patch"),
+    ("py:class", "xarray.backends.common.ArrayWriter"),
+    ("py:class", "xarray.core.treenode.NodePath"),
+    ("py:class", "zarr.core.group.ConsolidatedMetadata"),
+    ("py:class", "zarr.core._tree.TreeRepr"),
+    # Sphinx does not recognize type parameters in generic classes
+    ("py:class", "ArrT"),
+    ("py:class", "NodeT"),
+    ("py:class", "StoreT"),
+    # Sphinx does not recognize type aliases
+    ("py:type", "VariableEncoding"),
+    ("py:class", "VariableEncoding"),
 ]
 
 
@@ -115,15 +129,17 @@
 # -- sphinx.ext.intersphinx options --
 intersphinx_mapping = {
     "python": ("https://docs.python.org/3", None),
-    "vivarium": (
-        "https://vivarium-core.readthedocs.io/en/latest/",
-        None,
-    ),
+    "pytest": ("https://docs.pytest.org/en/latest", None),
+    "vivarium": ("https://vivarium-core.readthedocs.io/en/latest/", None),
     "numpy": ("https://numpy.org/doc/stable", None),
+    "xarray": ("https://docs.xarray.dev/en/latest", None),
+    "zarr": ("https://zarr.readthedocs.io/en/latest", None),
     "matplotlib": ("https://matplotlib.org/stable/", None),
     "pandas": ("http://pandas.pydata.org/pandas-docs/dev", None),
     "polars": ("https://docs.pola.rs/api/python/stable", None),
     "sympy": ("https://docs.sympy.org/latest", None),
+    "pint": ("https://pint.readthedocs.io/en/stable", None),
+    "unum": ("https://unum.readthedocs.io/en/stable", None),
 }
 
 
@@ -143,8 +159,24 @@
 ]
 # Move typehints from signature into description
 autodoc_typehints = "description"
-# Concatenate class and __init__ docstrings
-autoclass_content = "both"
+# Only use the class's docstring. __init__ docstrings are now listed separately.
+autoclass_content = "class"
+# Default options for all autodoc directives.
+autodoc_default_options = {
+    "member-order": "bysource",
+    "private-members": True,
+    "special-members": (
+        # object
+        "__init__,  __del__, __call__"
+    ),
+    "exclude-members": (
+        # abc.ABC
+        "_abc_impl, "
+        # enum.Flag
+        "_flag_mask_, _singles_mask_, _all_bits_, _boundary_, _inverted_, "
+        "_generate_next_value_"
+    )
+}
 # Remove domain objects (e.g. functions, classes, attributes) from
 # table of contents
 toc_object_entries = False
diff --git a/doc/experiments.rst b/doc/experiments.rst
index 9e6a423e2..2fe680faa 100644
--- a/doc/experiments.rst
+++ b/doc/experiments.rst
@@ -396,6 +396,9 @@ Here are some general rules to remember when writing your own JSON config files:
     without dividing, this results in a more informative error message instead
     of a Nextflow error about missing daughter cell states.
 
+
+.. _experiment_output:
+
 ------
 Output
 ------
diff --git a/doc/stores.rst b/doc/stores.rst
index d1a379355..4a28d433d 100644
--- a/doc/stores.rst
+++ b/doc/stores.rst
@@ -368,6 +368,8 @@ any number of attributes for all active (``_entryState`` is 1) unique molecules
 of a given type (e.g. RNA, active RNAP, etc.).
 
 
+.. _listeners:
+
 ---------
 Listeners
 ---------
diff --git a/doc/workflows.rst b/doc/workflows.rst
index d015d0dc0..4a1848e5c 100644
--- a/doc/workflows.rst
+++ b/doc/workflows.rst
@@ -330,6 +330,7 @@ it has access to.
   folder, you can just create stub files in the appropriate folders
   that simply import the ``plot`` function from a primary analysis script.
 
+
 .. _analysis_config:
 
 Configuration
@@ -502,6 +503,9 @@ Refer to :ref:`/output.rst` for more information about how
 to use DuckDB to read and analyze simulation output inside
 analysis scripts.
 
+
+.. _workflows:
+
 ---------
 Workflows
 ---------
@@ -700,6 +704,7 @@ is a list workflow behaviors enabled in our model to handle unexpected errors.
   depends on generation 6, :py:mod:`runscripts.create_variants` depends on
   :py:mod:`runscripts.parca`, etc).
 
+
 .. _output:
 
 ------
diff --git a/ecoli/__init__.py b/ecoli/__init__.py
index 673b8391f..24e2c5c2f 100644
--- a/ecoli/__init__.py
+++ b/ecoli/__init__.py
@@ -6,6 +6,7 @@
 )
 
 from ecoli.library.parquet_emitter import ParquetEmitter
+from ecoli.library.xarray_emitter.emitter import XarrayEmitter
 from ecoli.library.schema import (
     divide_binomial,
     divide_bulk,
@@ -39,6 +40,7 @@
 faulthandler.enable()
 
 emitter_registry.register("parquet", ParquetEmitter)
+emitter_registry.register("xarray", XarrayEmitter)
 
 # register :term:`updaters`
 inverse_updater_registry.register("accumulate", inverse_update_accumulate)
diff --git a/ecoli/experiments/ecoli_master_sim.py b/ecoli/experiments/ecoli_master_sim.py
index b77bc2be9..efa2aca2e 100644
--- a/ecoli/experiments/ecoli_master_sim.py
+++ b/ecoli/experiments/ecoli_master_sim.py
@@ -24,15 +24,16 @@
 import numpy as np
 from fsspec import open as fsspec_open
 from vivarium.core.engine import Engine
-from vivarium.core.composer import deep_merge
+from vivarium.core.composer import Composite, deep_merge
 from vivarium.core.process import Process
 from vivarium.core.serialize import deserialize_value, serialize_value
 from vivarium.library.dict_utils import deep_merge_check
 from vivarium.library.topology import inverse_topology
 from vivarium.library.topology import assoc_path, get_in
 from ecoli.library.logging_tools import write_json
-from wholecell.utils.filepath import cloud_path_join
+from ecoli.library.parquet_emitter import BufferedEmitter
 import ecoli.composites.ecoli_master
+from wholecell.utils.filepath import cloud_path_join
 
 # Environment composer for spatial environment sim
 import ecoli.composites.environment.lattice
@@ -42,7 +43,6 @@
 from ecoli.processes.registries import topology_registry
 
 from configs import CONFIG_DIR_PATH
-from ecoli.library.parquet_emitter import ParquetEmitter
 from ecoli.library.schema import not_a_process
 
 from wholecell.utils.filepath import ROOT_PATH
@@ -256,6 +256,7 @@ def __init__(
             self.parser.add_argument(
                 "--experiment_id",
                 action="store",
+                type=str,
                 help=(
                     "ID for this experiment. A UUID will be generated if "
                     'this argument is not used and "experiment_id" is null '
@@ -346,8 +347,7 @@ def __init__(
                 "--variant", action="store", help="Name of variant."
             )
             self.parser.add_argument(
-                "--lineage_seed",
-                action="store",
+                "--lineage_seed", action="store", type=int,
                 help="Seed used for first cell in lineage.",
             )
             self.parser.add_argument(
@@ -467,15 +467,19 @@ def __init__(self, config: dict[str, Any]):
 
         # Keep track of base experiment id
         # in case multiple simulations are run with suffix_time = True.
-        self.experiment_id_base = config["experiment_id"]
+        self.experiment_id: str
+        self.experiment_id_base: str = config["experiment_id"]
         self.config = config
-        self.ecoli = None
-        """vivarium.core.composer.Composite: Contains the fully instantiated 
-        processes, steps, topologies, and flow necessary to run simulation. 
-        Generated by 
+        self.emitter_config: dict[str, Any] = {}
+
+        self.ecoli: Composite
+        """
+        Contains the fully instantiated processes, steps, topologies, and flow
+        necessary to run simulation. Generated by
         :py:meth:`~ecoli.experiments.ecoli_master_sim.EcoliSim.build_ecoli` and 
         cleared when :py:meth:`~ecoli.experiments.ecoli_master_sim.EcoliSim.run` 
-        is called to potentially free up memory after division."""
+        is called to potentially free up memory after division.
+        """
         self.generated_initial_state = None
         """dict: Fully populated initial state for simulation. Generated by 
         :py:meth:`~ecoli.experiments.ecoli_master_sim.EcoliSim.build_ecoli` and 
@@ -744,60 +748,77 @@ def build_ecoli(self):
                 initial_environment, self.generated_initial_state
             )
 
-    def update_experiment(self, time_to_update: float = 0.0):
+    def update_experiment(
+        self, time_to_update: float = 0.0, finalize: bool = True
+    ) -> None:
         """
-        Runs the E. coli simulation for a specified amount of time. If the
-        simulation reaches a division event and ``config['generations']`` is set,
-        it will save the daughter cell states to JSON files in the directory
-        specified by ``config['daughter_outdir']``. Also creates a file
-        ``division_time.sh`` that, when executed, sets the environment variable
-        ``division_time`` to the time at which division occurred (used in
-        Nextflow workflow runs).
+        Run the simulation for ``time_to_update``. On division (requires
+        ``config['generations']``), call :py:meth:`~.persist_generation` and
+        exit the interpreter. ``finalize=False`` skips the emitter flush on a
+        normal return only; division and errors other than Ctrl-C still flush.
+
+        Called by: :py:meth:`.run` or :py:meth:`.save_states`.
         """
         try:
-            self.ecoli_experiment.update(time_to_update)
+            success = False
+            if time_to_update > 0:
+                self.ecoli_experiment.update(time_to_update)
         except DivisionDetected:
-            state = self.ecoli_experiment.state.get_value(condition=not_a_process)
-            assert len(state["agents"]) == 2
-            # Daughter state should include all of the additional
-            # non-agent state (e.g. environment state)
-            non_agent_state = {k: v for k, v in state.items() if k != "agents"}
-            for i, (agent_id, agent_state) in enumerate(state["agents"].items()):
-                prepare_save_state(agent_state)
-                daughter_filename = f"daughter_state_{i}.json"
-                daughter_path = cloud_path_join(self.daughter_outdir, daughter_filename)
-                write_json(
-                    daughter_path,
-                    {**non_agent_state, "agents": {agent_id: agent_state}},
-                )
-                # Write daughter state URI to local file for Nextflow to read
-                with open(f"daughter_state_{i}_uri.txt", "w") as f:
-                    f.write(daughter_path)
-            print(
-                f"Divided at t = {self.ecoli_experiment.global_time} after "
-                f"{self.ecoli_experiment.global_time - self.initial_global_time} sec."
+            self.persist_generation()
+            success = True
+        finally:
+            # Don't start new I/O operations during a manual shutdown.
+            if not isinstance(error := sys.exception(), KeyboardInterrupt):
+                if isinstance(emitter := self.ecoli_experiment.emitter, BufferedEmitter):
+                    # Finish writing buffered emits to persistent storage. The
+                    # `.save_states()` loop only defers this on a clean return.
+                    if finalize or success or error is not None:
+                        emitter.finalize(success=success)
+                if success:
+                    # Exit so that `.run()` does not raise `TimeLimitError`.
+                    sys.exit()
+
+    def persist_generation(self, *, num_agents: int = 2) -> None:
+        """
+        Upon reaching cell division, save the daughter cell states to JSON files
+        in the directory specified by ``config['daughter_outdir']``. Also,
+        create a file ``division_time.sh`` that, when executed, sets the
+        environment variable ``division_time`` to the time at which division
+        occurred, as expected by
+        ``runscripts/nextflow/sim.nf::{simGen0,sim}.output``.
+
+        Called by: :py:meth:`~.update_experiment`.
+
+        Args:
+            num_agents: Expected number of cells. This argument exists solely
+                        for testing purposes.
+        """
+        state = self.ecoli_experiment.state.get_value(condition=not_a_process)
+        assert len(state["agents"]) == num_agents
+        # Daughter state should include all of the additional
+        # non-agent state (e.g. environment state)
+        non_agent_state = {k: v for k, v in state.items() if k != "agents"}
+        for i, (agent_id, agent_state) in enumerate(state["agents"].items()):
+            prepare_save_state(agent_state)
+            daughter_filename = f"daughter_state_{i}.json"
+            daughter_path = cloud_path_join(self.daughter_outdir, daughter_filename)
+            write_json(
+                daughter_path,
+                {**non_agent_state, "agents": {agent_id: agent_state}},
             )
-            # Nextflow workflows will source division time to determine
-            # initial global time to use for daughter cells
-            with open("division_time.sh", "w") as f:
-                f.write(f"export division_time={self.ecoli_experiment.global_time}")
-            # Tell Parquet emitter that simulation was successful
-            if isinstance(self.ecoli_experiment.emitter, ParquetEmitter):
-                self.ecoli_experiment.emitter.success = True
-                self.ecoli_experiment.emitter.finalize()
-            # Exit so that EcoliSim.run() does not raise TimeLimitError
-            sys.exit()
-        except:  # noqa: E722
-            # Finish writing any buffered emits to Parquet files if the simulation
-            # encounters any error (including KeyboardInterrupt)
-            # We use a bare except instead of finally because we don't want to
-            # run finalize() every time update_experiment is called to advance to
-            # save times in save_states()
-            if isinstance(self.ecoli_experiment.emitter, ParquetEmitter):
-                self.ecoli_experiment.emitter.finalize()
-            raise
-
-    def save_states(self):
+            # Write daughter state URI to local file for Nextflow to read
+            with open(f"daughter_state_{i}_uri.txt", "w") as f:
+                f.write(daughter_path)
+        print(
+            f"Divided at t = {self.ecoli_experiment.global_time} after "
+            f"{self.ecoli_experiment.global_time - self.initial_global_time} sec."
+        )
+        # Nextflow workflows will source division time to determine
+        # initial global time to use for daughter cells
+        with open("division_time.sh", "w") as f:
+            f.write(f"export division_time={self.ecoli_experiment.global_time}")
+
+    def save_states(self) -> None:
         """
         Runs the simulation while saving the states of specific
         timesteps to files named ``data/vivecoli_t{time}.json``. Invoked by
@@ -805,6 +826,10 @@ def save_states(self):
         if ``config['save'] == True``. State is saved as a JSON that
         can be reloaded into a simulation as described in
         :py:meth:`~ecoli.composites.ecoli_master.Ecoli.initial_state`.
+
+        Called by: :py:meth:`.run`.
+
+        Calls: :py:meth:`~.update_experiment`.
         """
         for time in self.save_times:
             if time > self.max_duration:
@@ -818,7 +843,7 @@ def save_states(self):
                 time_to_next_save = self.save_times[i]
             else:
                 time_to_next_save = self.save_times[i] - self.save_times[i - 1]
-            self.update_experiment(time_to_next_save)
+            self.update_experiment(time_to_next_save, finalize=False)
             time_elapsed = self.save_times[i]
             state = self.ecoli_experiment.state.get_value(condition=not_a_process)
             if self.divide:
@@ -829,18 +854,19 @@ def save_states(self):
             write_json("data/vivecoli_t" + str(time_elapsed) + ".json", state)
             print("Finished saving the state at t = " + str(time_elapsed))
         time_remaining = self.max_duration - self.save_times[-1]
-        if time_remaining:
-            self.update_experiment(time_remaining)
+        self.update_experiment(time_remaining)
 
-    def run(self):
-        """Create and run an EcoliSim experiment. If the simulation reaches
+    def run(self) -> None:
+        """
+        Create and run an EcoliSim experiment. If the simulation reaches
         the maximum duration specified by ``config['max_duration']``, it will
         raise a :py:class:`~ecoli.experiments.ecoli_master_sim.TimeLimitError`
         if ``config['fail_at_max_duration']`` is ``True``.
 
+        Calls: :py:meth:`~.update_experiment` or :py:meth:`~.save_states`.
+
         .. WARNING::
-            Run :py:meth:`~ecoli.experiments.ecoli_master_sim.EcoliSim.build_ecoli`
-            before calling :py:meth:`~ecoli.experiments.ecoli_master_sim.EcoliSim.run`!
+            Run :py:meth:`~.build_ecoli` before calling :py:meth:`~.run`!
         """
         if self.ecoli is None:
             raise RuntimeError(
@@ -857,15 +883,22 @@ def run(self):
                 for key, value in self.emitter_arg.items():
                     self.emitter_config[key] = value
             if self.emitter == "parquet":
-                if ("out_dir" not in self.emitter_config) and (
-                    "out_uri" not in self.emitter_config
-                ):
-                    raise RuntimeError(
+                if not any(map(self.emitter_config.__contains__,
+                               ["out_dir", "out_uri"])):
+                    raise KeyError(
                         "Must provide out_dir or out_uri"
-                        " as emitter argument for parquet emitter."
-                    )
+                        " as emitter argument for parquet emitter.")
+            elif self.emitter == "xarray":
+                if not (
+                    not any(map(self.emitter_config.__contains__,
+                                ["out_dir", "out_uri"]))
+                    and "store" in self.emitter_config.get("writer", {})
+                ):
+                    raise KeyError(
+                        "For {\"emitter\": \"xarray\"}, please provide:\n"
+                        "  {\"emitter_arg\": {\"writer\": {\"store\": ... }}}")
         else:
-            raise RuntimeError(
+            raise TypeError(
                 "Emitter option must be a string"
                 " representing the emitter type with any additional config"
                 " options under the emitter_arg key."
@@ -903,6 +936,10 @@ def run(self):
                     f" != {parse.quote_plus(self.experiment_id)}"
                 )
             experiment_config["experiment_id"] = self.experiment_id
+            # Ensure that `suffix_time` is in effect for all duplicates
+            # of `experiment_id`
+            assert metadata["experiment_id"] == self.experiment_id_base
+            metadata["experiment_id"] = self.experiment_id
         experiment_config["profile"] = self.profile
 
         # Since unique numpy updater is an class method, internal
@@ -917,12 +954,11 @@ def run(self):
         self.ecoli_experiment = Engine(**experiment_config)
 
         # Only emit designated stores if specified
-        if self.config["emit_paths"]:
-            self.ecoli_experiment.state.set_emit_values([tuple()], False)
-            self.ecoli_experiment.state.set_emit_values(
-                self.config["emit_paths"],
-                True,
-            )
+        if isinstance(emitter := self.ecoli_experiment.emitter, BufferedEmitter):
+            emitter.reset_emit_flags(
+                engine=self.ecoli_experiment,
+                agent=("agents", self.agent_id),
+                emit_paths=self.config["emit_paths"])
 
         # Clean up unnecessary references
         self.generated_initial_state = None
diff --git a/ecoli/library/emitter.py b/ecoli/library/emitter.py
new file mode 100644
index 000000000..095a68b22
--- /dev/null
+++ b/ecoli/library/emitter.py
@@ -0,0 +1,168 @@
+
+"""
+Extensions to the :py:class:`~vivarium.core.emitter.Emitter` interface, as used
+by :py:class:`.ParquetEmitter` and :py:class:`.XarrayEmitter`.
+"""
+
+
+from __future__ import annotations
+
+from abc import ABC, abstractmethod
+from concurrent.futures import Future, Executor
+from dataclasses import dataclass, field, replace
+from typing import Any, Callable, Self
+from urllib import parse
+from warnings import warn
+
+from vivarium.core.types import HierarchyPath
+from vivarium.core.engine import Engine
+from vivarium.core.emitter import Emitter
+
+
+# ==============================================================================
+
+
+class BlockingExecutor(Executor):
+    """Executor whose `submit` runs the callable inline before returning."""
+    def __init__(self, *args) -> None:
+        assert not len(args)  # guard: accepts no positional arguments
+        super().__init__()
+
+    def submit(self, fn: Callable, /, *args, **kwargs) -> Future:
+        """
+        Run a function in the current thread, and return a
+        :py:class:`~concurrent.futures.Future` that is already done.
+        """
+        future: Future = Future()
+        try:
+            result = fn(*args, **kwargs)
+            future.set_result(result)
+        except Exception as e:
+            future.set_exception(e)  # stored on the future, not raised here
+        return future
+
+    def shutdown(self, wait: bool = True, *, cancel_futures: bool = False) -> None:
+        pass  # no-op: both arguments are ignored
+
+
+# ==============================================================================
+
+
+@dataclass(eq=True, kw_only=True, slots=True)
+class StoragePartition:
+    """
+    Metadata determining the relative storage location for the simulation
+    outputs of a single-generation :py:class:`.EcoliSim`, inside a hive
+    partition or hierarchical store (see :ref:`parquet_emitter`).
+    """
+
+    experiment_id: str
+    variant: int
+    lineage_seed: int
+    generation: int = field(init=False)  # derived in `__post_init__`
+    agent_id: str
+
+    def __post_init__(self) -> None:
+        assert isinstance(self.experiment_id, str)
+        assert isinstance(self.variant, int)
+        assert isinstance(self.lineage_seed, int)
+        assert isinstance(self.agent_id, str)
+        self.generation = len(self.agent_id)  # one character per generation
+        assert self.generation > 0  # i.e. `agent_id` must not be empty
+
+    @property
+    def parent(self) -> Self:
+        """
+        Mother cell metadata: ``agent_id`` with its last character dropped.
+        """
+        return replace(self, agent_id=self.agent_id[:-1])
+
+
+# ==============================================================================
+
+
+class BufferedEmitter(Emitter, ABC):
+    """
+    An extension to the :py:class:`~vivarium.core.emitter.Emitter` interface
+    that buffers emitted simulation data before writing it to persistent
+    storage. In particular, this interface is used by
+    :py:meth:`.EcoliSim.update_experiment` and
+    :py:meth:`.EngineProcess.next_update`.
+
+    .. warning::
+        :py:meth:`~.finalize` must be explicitly called in a
+        ``try ... finally ...`` block around the call to
+        :py:meth:`vivarium.core.engine.Engine.update`, in order to ensure that
+        all buffered emits are written out when the simulation terminates for
+        any reason.
+    """
+
+    def __init__(self) -> None:
+        """
+        .. warning::
+            This method should be called **at the end** of a subclass
+            ``__init__()``.
+        """
+        self.finalized: bool = False
+        """
+        Flag set by :py:meth:`.finalize` after writing the last buffer.
+        """
+
+    @abstractmethod
+    def reset_emit_flags(
+        self, *,
+        engine: Engine, agent: HierarchyPath, emit_paths: tuple[HierarchyPath, ...]
+    ) -> None:
+        """
+        Reconfigure the simulation engine to avoid futile data marshalling, by
+        suppressing all default emissions and enabling only stores that were
+        explicitly requested by this emitter's configuration.
+
+        Called by: :py:meth:`.EcoliSim.run` or
+        :py:meth:`.EngineProcess.create_emitter`.
+        """
+        ...
+
+    def extract_partition(self, metadata: dict[str, Any], /) -> StoragePartition:
+        """
+        Define the current :py:class:`StoragePartition` from the metadata sent
+        by :py:meth:`!Engine._emit_configuration`; absent keys use defaults.
+        """
+        return StoragePartition(
+            experiment_id=parse.quote_plus(
+                metadata.get("experiment_id", "default")),
+            variant=int(metadata.get("variant", 0)),
+            lineage_seed=int(metadata.get("lineage_seed", 0)),
+            agent_id=metadata.get("agent_id", "1"))
+
+    def finalize(self, *, success: bool = False) -> None:
+        """
+        Emit the partially filled buffer at the end of a single-generation
+        simulation. Raises :py:exc:`RuntimeError` if already finalized.
+
+        Args:
+            success: Indicates whether the simulation reached a
+                     :py:exc:`.DivisionDetected` event.
+        """
+        if self.finalized:
+            raise RuntimeError(
+                f"`{type(self).__name__}.finalize()` was already called.")
+        assert isinstance(success, bool)
+        self._finalize(success=success)
+        self.finalized = True  # only reached if `_finalize` did not raise
+
+    @abstractmethod
+    def _finalize(self, *, success: bool) -> None:
+        """
+        Subclass hook for the final write. Called by: :py:meth:`.finalize`.
+        """
+        ...
+
+    def __del__(self) -> None:
+        """
+        When a successfully initialised :py:class:`.BufferedEmitter` instance is
+        destroyed, check that its last batch has been flushed by the simulation
+        loop.
+        """
+        if not getattr(self, "finalized", True):  # unset => `__init__` never ran
+            warn(f"\n  `{type(self).__name__}.finalize()` was never called.")
diff --git a/ecoli/library/parquet_emitter.py b/ecoli/library/parquet_emitter.py
index 5e2a9251c..607ed3765 100644
--- a/ecoli/library/parquet_emitter.py
+++ b/ecoli/library/parquet_emitter.py
@@ -1,7 +1,9 @@
+
 import os
 import fnmatch
 from concurrent.futures import Future, ThreadPoolExecutor
-from typing import Any, Callable, cast, Mapping, Optional
+from dataclasses import asdict
+from typing import Any, Callable, Mapping, Optional, cast, final
 from urllib import parse
 
 import duckdb
@@ -12,7 +14,15 @@
 from fsspec.core import filesystem, url_to_fs, OpenFile
 from fsspec.spec import AbstractFileSystem
 from tqdm import tqdm
-from vivarium.core.emitter import Emitter
+
+from vivarium.core.types import HierarchyPath
+from vivarium.core.engine import Engine
+
+from .emitter import BlockingExecutor, BufferedEmitter
+
+
+# ==============================================================================
+
 
 METADATA_PREFIX = "output_metadata__"
 """
@@ -62,6 +72,9 @@
 """uint32 is 2x smaller than int64 for values between 0 - 4,294,967,295."""
 
 
+# ==============================================================================
+
+
 def json_to_parquet(
     emit_dict: dict[str, np.ndarray | list[pl.Series]],
     outfile: str,
@@ -839,22 +852,11 @@ def pl_dtype_from_ndarray(arr: np.ndarray) -> pl.DataType:
     return pl_dtype
 
 
-class BlockingExecutor:
-    def submit(self, fn: Callable, *args, **kwargs) -> Future:
-        """
-        Run function in the current thread and return a Future that
-        is already done.
-        """
-        future: Future = Future()
-        try:
-            result = fn(*args, **kwargs)
-            future.set_result(result)
-        except Exception as e:
-            future.set_exception(e)
-        return future
+# ==============================================================================
 
 
-class ParquetEmitter(Emitter):
+@final
+class ParquetEmitter(BufferedEmitter):
     """
     Emit data to a Parquet dataset. Note that :py:meth:`~.finalize`
     must be explicitly called in a ``try...finally`` block around the call to
@@ -907,22 +909,32 @@ def __init__(self, config: dict[str, Any]) -> None:
         # was successfully written to Parquet in order to avoid blocking
         self.last_batch_future: Future = Future()
         self.last_batch_future.set_result(None)
-        # Set either by EcoliSim or by EngineProcess if sim reaches division
-        self.success = False
-
-    def finalize(self):
-        """Convert remaining batched emits to Parquet at sim shutdown
-        and mark sim as successful if ``success`` flag was set. In vEcoli,
-        this is done by :py:class:`~ecoli.experiments.ecoli_master_sim.EcoliSim`
-        upon reaching division.
+        super().__init__()
+
+    def reset_emit_flags(
+        self, *,
+        engine: Engine, agent: HierarchyPath, emit_paths: tuple[HierarchyPath, ...]
+    ) -> None:
+        """
+        In this subclass, ``agent`` is ignored and ``emit_paths`` are global
+        paths; an empty ``emit_paths`` leaves all emit flags unchanged.
+        """
+        assert engine.emitter is self
+        if emit_paths:
+            state = self.ecoli_experiment.state
+            state.set_emit_value(emit=False, path=tuple())
+            state.set_emit_values(emit=True, paths=emit_paths)
+
+    def _finalize(self, *, success: bool):
+        """
+        Convert remaining batched emits to Parquet at sim shutdown and mark sim
+        as successful if ``success`` flag was set.
         """
         # Wait for last batch to finish writing
         self.last_batch_future.result()
         # Flush any remaining buffered emits to Parquet
         outfile = os.path.join(
-            self.out_uri,
-            self.experiment_id,
-            "history",
+            self.out_uri, self.experiment_id, "history",
             self.partitioning_path,
             f"{self.num_emits}.pq",
         )
@@ -934,11 +946,9 @@ def finalize(self):
                 self.buffered_emits, outfile, self.pl_types, self.filesystem
             )
         # Hive-partitioned directory that only contains successful sims
-        if self.success:
+        if success:
             success_file = os.path.join(
-                self.out_uri,
-                self.experiment_id,
-                "success",
+                self.out_uri, self.experiment_id, "success",
                 self.partitioning_path,
                 "s.pq",
             )
@@ -986,21 +996,10 @@ def emit(self, data: dict[str, Any]):
             data = {**data["data"].pop("metadata", {}), **data["data"]}
             data["time"] = data.get("initial_global_time", 0.0)
             # Manually create filepaths with hive partitioning
-            agent_id = data.get("agent_id", "1")
-            quoted_experiment_id = parse.quote_plus(
-                data.get("experiment_id", "default")
-            )
-            partitioning_keys = {
-                "experiment_id": quoted_experiment_id,
-                "variant": data.get("variant", 0),
-                "lineage_seed": data.get("lineage_seed", 0),
-                "generation": len(agent_id),
-                "agent_id": agent_id,
-            }
-            self.experiment_id = quoted_experiment_id
-            self.partitioning_path = os.path.join(
-                *(f"{k}={v}" for k, v in partitioning_keys.items())
-            )
+            partition = self.extract_partition(data)
+            self.partitioning_path = os.path.join(*(
+                f"{k}={v}" for (k, v) in asdict(partition).items()))
+            self.experiment_id = partition.experiment_id
             data = flatten_dict(data)
             config_emit: dict[str, Any] = {}
             config_schema: dict[str, pl.DataType] = {}
@@ -1014,9 +1013,7 @@ def emit(self, data: dict[str, Any]):
                     config_emit[k] = v
                     config_schema[k] = v.dtype
             outfile = os.path.join(
-                self.out_uri,
-                self.experiment_id,
-                "configuration",
+                self.out_uri, self.experiment_id, "configuration",
                 self.partitioning_path,
                 "config.pq",
             )
@@ -1036,7 +1033,8 @@ def emit(self, data: dict[str, Any]):
             )
             # Delete any sim output files in final filesystem
             history_outdir = os.path.join(
-                self.out_uri, self.experiment_id, "history", self.partitioning_path
+                self.out_uri, self.experiment_id, "history",
+                self.partitioning_path
             )
             try:
                 self.filesystem.delete(history_outdir, recursive=True)
@@ -1124,9 +1122,7 @@ def emit(self, data: dict[str, Any]):
             # If last batch of emits failed, exception should be raised here
             self.last_batch_future.result()
             outfile = os.path.join(
-                self.out_uri,
-                self.experiment_id,
-                "history",
+                self.out_uri, self.experiment_id, "history",
                 self.partitioning_path,
                 f"{self.num_emits}.pq",
             )
diff --git a/ecoli/library/test_parquet_emitter.py b/ecoli/library/test_parquet_emitter.py
index 526b8d10d..833d7ffaa 100644
--- a/ecoli/library/test_parquet_emitter.py
+++ b/ecoli/library/test_parquet_emitter.py
@@ -1,7 +1,5 @@
 import os
 import re
-import tempfile
-import shutil
 import duckdb
 import numpy as np
 import polars as pl
@@ -254,7 +252,7 @@ def test_union_pl_dtypes(self):
             pl.UInt32,
         ) == pl.List(pl.List(pl.List(pl.UInt32)))
 
-    def test_quote_columns(self):
+    def test_quote_columns(self, tmp_path):
         """Test quote_columns handles special characters correctly."""
         # Test single string with special characters
         assert quote_columns("simple") == '"simple"'
@@ -291,116 +289,114 @@ def test_quote_columns(self):
         assert quote_columns([]) == []
 
         # Test that quoted columns actually work in DuckDB queries with weird column names
-        with tempfile.TemporaryDirectory() as tmp_path:
-            test_file = os.path.join(tmp_path, "weird_cols.parquet")
-            # Create test data with columns containing special characters
-            test_data = pl.DataFrame(
-                {
-                    "simple": [1, 2, 3],
-                    "with spaces": [4, 5, 6],
-                    "with-hyphens": [7, 8, 9],
-                    "with[brackets]": [10, 11, 12],
-                    "with/slashes": [13, 14, 15],
-                    'has"quote': [16, 17, 18],
-                    "dot.name": [19, 20, 21],
-                    "colon:name": [22, 23, 24],
-                }
-            )
-            test_data.write_parquet(test_file, statistics=False)
-
-            conn = create_duckdb_conn()
-
-            # Test selecting individual columns with special characters
-            for col in test_data.columns:
-                quoted_col = quote_columns(col)
-                result = conn.sql(f"SELECT {quoted_col} FROM '{test_file}'").pl()
-                assert result.shape == (3, 1)
-                assert result.columns[0] == col
-                expected_values = test_data[col].to_list()
-                assert result[col].to_list() == expected_values
-
-            # Test selecting multiple columns at once
-            weird_cols = ["with spaces", "with-hyphens", "with[brackets]", 'has"quote']
-            quoted_cols = ", ".join(quote_columns(weird_cols))
-            result = conn.sql(f"SELECT {quoted_cols} FROM '{test_file}'").pl()
-            assert result.shape == (3, 4)
-            for col in weird_cols:
-                assert col in result.columns
-                assert result[col].to_list() == test_data[col].to_list()
-
-            # Test that using WHERE clause works with quoted columns
-            quoted_space_col = quote_columns("with spaces")
-            result = conn.sql(
-                f"SELECT * FROM '{test_file}' WHERE {quoted_space_col} > 4"
-            ).pl()
-            assert result.shape == (2, 8)
-            assert result["with spaces"].to_list() == [5, 6]
-
-            # Test aggregation with quoted columns
-            quoted_bracket_col = quote_columns("with[brackets]")
-            result = conn.sql(
-                f"SELECT AVG({quoted_bracket_col}) as avg_val FROM '{test_file}'"
-            ).pl()
-            assert result["avg_val"][0] == 11.0
-
-            # Test ORDER BY with quoted columns
-            quoted_slash_col = quote_columns("with/slashes")
-            result = conn.sql(
-                f"SELECT {quoted_slash_col} FROM '{test_file}' ORDER BY {quoted_slash_col} DESC"
-            ).pl()
-            assert result["with/slashes"].to_list() == [15, 14, 13]
-
-    def test_list_columns(self):
+        test_file = os.path.join(tmp_path, "weird_cols.parquet")
+        # Create test data with columns containing special characters
+        test_data = pl.DataFrame(
+            {
+                "simple": [1, 2, 3],
+                "with spaces": [4, 5, 6],
+                "with-hyphens": [7, 8, 9],
+                "with[brackets]": [10, 11, 12],
+                "with/slashes": [13, 14, 15],
+                'has"quote': [16, 17, 18],
+                "dot.name": [19, 20, 21],
+                "colon:name": [22, 23, 24],
+            }
+        )
+        test_data.write_parquet(test_file, statistics=False)
+
+        conn = create_duckdb_conn()
+
+        # Test selecting individual columns with special characters
+        for col in test_data.columns:
+            quoted_col = quote_columns(col)
+            result = conn.sql(f"SELECT {quoted_col} FROM '{test_file}'").pl()
+            assert result.shape == (3, 1)
+            assert result.columns[0] == col
+            expected_values = test_data[col].to_list()
+            assert result[col].to_list() == expected_values
+
+        # Test selecting multiple columns at once
+        weird_cols = ["with spaces", "with-hyphens", "with[brackets]", 'has"quote']
+        quoted_cols = ", ".join(quote_columns(weird_cols))
+        result = conn.sql(f"SELECT {quoted_cols} FROM '{test_file}'").pl()
+        assert result.shape == (3, 4)
+        for col in weird_cols:
+            assert col in result.columns
+            assert result[col].to_list() == test_data[col].to_list()
+
+        # Test that using WHERE clause works with quoted columns
+        quoted_space_col = quote_columns("with spaces")
+        result = conn.sql(
+            f"SELECT * FROM '{test_file}' WHERE {quoted_space_col} > 4"
+        ).pl()
+        assert result.shape == (2, 8)
+        assert result["with spaces"].to_list() == [5, 6]
+
+        # Test aggregation with quoted columns
+        quoted_bracket_col = quote_columns("with[brackets]")
+        result = conn.sql(
+            f"SELECT AVG({quoted_bracket_col}) as avg_val FROM '{test_file}'"
+        ).pl()
+        assert result["avg_val"][0] == 11.0
+
+        # Test ORDER BY with quoted columns
+        quoted_slash_col = quote_columns("with/slashes")
+        result = conn.sql(
+            f"SELECT {quoted_slash_col} FROM '{test_file}' ORDER BY {quoted_slash_col} DESC"
+        ).pl()
+        assert result["with/slashes"].to_list() == [15, 14, 13]
+
+    def test_list_columns(self, tmp_path):
         """Test list_columns retrieves column names correctly."""
-        with tempfile.TemporaryDirectory() as tmp_path:
-            # Create test Parquet file with known columns
-            test_file = os.path.join(tmp_path, "test.parquet")
-            test_data = pl.DataFrame(
-                {
-                    "col_a": [1, 2, 3],
-                    "col_b": [4.0, 5.0, 6.0],
-                    "listeners__mass__cell_mass": [7.0, 8.0, 9.0],
-                    "listeners__mass__dry_mass": [10.0, 11.0, 12.0],
-                    "listeners__growth__instantaneous_growth_rate": [0.1, 0.2, 0.3],
-                    "bulk": [[1, 2], [3, 4], [5, 6]],
-                }
-            )
-            test_data.write_parquet(test_file, statistics=False)
+        # Create test Parquet file with known columns
+        test_file = os.path.join(tmp_path, "test.parquet")
+        test_data = pl.DataFrame(
+            {
+                "col_a": [1, 2, 3],
+                "col_b": [4.0, 5.0, 6.0],
+                "listeners__mass__cell_mass": [7.0, 8.0, 9.0],
+                "listeners__mass__dry_mass": [10.0, 11.0, 12.0],
+                "listeners__growth__instantaneous_growth_rate": [0.1, 0.2, 0.3],
+                "bulk": [[1, 2], [3, 4], [5, 6]],
+            }
+        )
+        test_data.write_parquet(test_file, statistics=False)
 
-            conn = create_duckdb_conn()
-            subquery = f"SELECT * FROM '{test_file}'"
+        conn = create_duckdb_conn()
+        subquery = f"SELECT * FROM '{test_file}'"
 
-            # Test getting all columns
-            all_cols = list_columns(conn, subquery)
-            assert len(all_cols) == 6
-            assert "col_a" in all_cols
-            assert "col_b" in all_cols
-            assert "listeners__mass__cell_mass" in all_cols
+        # Test getting all columns
+        all_cols = list_columns(conn, subquery)
+        assert len(all_cols) == 6
+        assert "col_a" in all_cols
+        assert "col_b" in all_cols
+        assert "listeners__mass__cell_mass" in all_cols
 
-            # Test pattern matching with glob patterns
-            listener_cols = list_columns(conn, subquery, "listeners__*")
-            assert len(listener_cols) == 3
-            assert all(col.startswith("listeners__") for col in listener_cols)
+        # Test pattern matching with glob patterns
+        listener_cols = list_columns(conn, subquery, "listeners__*")
+        assert len(listener_cols) == 3
+        assert all(col.startswith("listeners__") for col in listener_cols)
 
-            # Test pattern matching for specific listener
-            mass_cols = list_columns(conn, subquery, "listeners__mass__*")
-            assert len(mass_cols) == 2
-            assert "listeners__mass__cell_mass" in mass_cols
-            assert "listeners__mass__dry_mass" in mass_cols
+        # Test pattern matching for specific listener
+        mass_cols = list_columns(conn, subquery, "listeners__mass__*")
+        assert len(mass_cols) == 2
+        assert "listeners__mass__cell_mass" in mass_cols
+        assert "listeners__mass__dry_mass" in mass_cols
 
-            # Test pattern that matches nothing
-            no_match = list_columns(conn, subquery, "nonexistent__*")
-            assert len(no_match) == 0
+        # Test pattern that matches nothing
+        no_match = list_columns(conn, subquery, "nonexistent__*")
+        assert len(no_match) == 0
 
-            # Test pattern with single character wildcard
-            col_pattern = list_columns(conn, subquery, "col_?")
-            assert len(col_pattern) == 2
-            assert "col_a" in col_pattern
-            assert "col_b" in col_pattern
+        # Test pattern with single character wildcard
+        col_pattern = list_columns(conn, subquery, "col_?")
+        assert len(col_pattern) == 2
+        assert "col_a" in col_pattern
+        assert "col_b" in col_pattern
 
-            # Test exact match pattern
-            exact = list_columns(conn, subquery, "bulk")
-            assert exact == ["bulk"]
+        # Test exact match pattern
+        exact = list_columns(conn, subquery, "bulk")
+        assert exact == ["bulk"]
 
 
 def compare_nested(a: list, b: list) -> bool:
@@ -420,21 +416,16 @@ def compare_nested(a: list, b: list) -> bool:
 
 
 class TestParquetEmitter:
-    @pytest.fixture
-    def temp_dir(self):
-        """Create a temporary directory for testing."""
-        tmp = tempfile.mkdtemp()
-        yield tmp
-        shutil.rmtree(tmp)
 
-    def test_initialization(self, temp_dir):
+    def test_initialization(self, tmp_path):
         """Test ParquetEmitter initialization with different configs."""
         # Test with out_dir
-        emitter = ParquetEmitter({"out_dir": temp_dir})
+        emitter = ParquetEmitter({"out_dir": tmp_path})
         emitter.experiment_id = "test_exp"
         emitter.partitioning_path = "path/to/output"
-        assert emitter.out_uri == os.path.abspath(temp_dir)
+        assert emitter.out_uri == os.path.abspath(tmp_path)
         assert emitter.batch_size == 400
+        emitter.finalized = True
 
         # Test with out_uri and custom batch size
         emitter = ParquetEmitter({"out_uri": "gs://bucket/path", "batch_size": 100})
@@ -442,10 +433,11 @@ def test_initialization(self, temp_dir):
         emitter.partitioning_path = "path/to/output"
         assert emitter.out_uri == "gs://bucket/path"
         assert emitter.batch_size == 100
+        emitter.finalized = True
 
-    def test_emit_configuration(self, temp_dir):
+    def test_emit_configuration(self, tmp_path):
         """Test emitting configuration data."""
-        emitter = ParquetEmitter({"out_dir": temp_dir})
+        emitter = ParquetEmitter({"out_dir": tmp_path})
 
         # Setup ThreadPoolExecutor mock
         future = Future()
@@ -466,6 +458,7 @@ def test_emit_configuration(self, temp_dir):
         }
 
         emitter.emit(config_data)
+        emitter.finalized = True
 
         # Verify partitioning path
         assert emitter.experiment_id == "test_exp"
@@ -477,9 +470,9 @@ def test_emit_configuration(self, temp_dir):
         args, _ = emitter.executor.submit.call_args
         assert args[0] == json_to_parquet
 
-    def test_emit_simulation_data(self, temp_dir):
+    def test_emit_simulation_data(self, tmp_path):
         """Test emitting simulation data with various types."""
-        emitter = ParquetEmitter({"out_dir": temp_dir, "batch_size": 2})
+        emitter = ParquetEmitter({"out_dir": tmp_path, "batch_size": 2})
 
         # Configuration emit to initialize variables
         config_data = {
@@ -542,6 +535,7 @@ def test_emit_simulation_data(self, temp_dir):
         emitter.emit(sim_data1)
         assert emitter.num_emits == 2
         emitter.last_batch_future.result()
+        emitter.finalized = True
 
         # Check output
         t = pl.read_parquet(
@@ -561,9 +555,9 @@ def test_emit_simulation_data(self, temp_dir):
         assert all(t["nested__value"] == [100] * 2)
         assert emitter.buffered_emits == {}
 
-    def test_variable_length_arrays(self, temp_dir):
+    def test_variable_length_arrays(self, tmp_path):
         """Test handling arrays with changing dimensions."""
-        emitter = ParquetEmitter({"out_dir": temp_dir, "batch_size": 3})
+        emitter = ParquetEmitter({"out_dir": tmp_path, "batch_size": 3})
         # Configuration emit to initialize variables
         config_data = {
             "table": "configuration",
@@ -629,6 +623,7 @@ def test_variable_length_arrays(self, temp_dir):
         # Write to Parquet and check output
         emitter.emit(sim_data2)
         emitter.last_batch_future.result()
+        emitter.finalized = True
 
         t = pl.read_parquet(
             os.path.join(
@@ -650,9 +645,9 @@ def test_variable_length_arrays(self, temp_dir):
             [[1], [1, 2], [1, 2, 3]],
         ]
 
-    def test_extreme_data_types(self, temp_dir):
+    def test_extreme_data_types(self, tmp_path):
         """Test with extreme data types and edge cases."""
-        emitter = ParquetEmitter({"out_dir": temp_dir, "batch_size": 2})
+        emitter = ParquetEmitter({"out_dir": tmp_path, "batch_size": 2})
         # Create test data with extreme values and special cases
         sim_data = {
             "table": "configuration",
@@ -790,6 +785,7 @@ def test_extreme_data_types(self, temp_dir):
         emitter.emit(sim_data_2)
         emitter.last_batch_future.result()
         assert emitter.buffered_emits == {}
+        emitter.finalized = True
 
         out_path = os.path.join(
             emitter.out_uri,
@@ -852,9 +848,9 @@ def test_extreme_data_types(self, temp_dir):
                 f"Mismatch in field {key}"
             )
 
-    def test_finalize(self, temp_dir):
+    def test_finalize(self, tmp_path):
         """Test finalize method that handles remaining data."""
-        emitter = ParquetEmitter({"out_dir": temp_dir})
+        emitter = ParquetEmitter({"out_dir": tmp_path})
         emitter.experiment_id = "test_exp"
         emitter.partitioning_path = "path/to/output"
 
@@ -886,8 +882,8 @@ def test_finalize(self, temp_dir):
             assert args[0]["field2"][0] == 20.5
 
         # Test success flag
-        emitter.success = True
-        emitter.finalize()
+        emitter.finalized = False
+        emitter.finalize(success=True)
         assert os.path.exists(
             os.path.join(
                 emitter.out_uri,
@@ -898,8 +894,8 @@ def test_finalize(self, temp_dir):
             )
         )
 
-    def test_multiple_agents(self, temp_dir):
-        emitter = ParquetEmitter({"out_dir": temp_dir})
+    def test_multiple_agents(self, tmp_path):
+        emitter = ParquetEmitter({"out_dir": tmp_path})
         emitter.experiment_id = "test_exp"
         emitter.partitioning_path = "path/to/output"
 
@@ -916,11 +912,12 @@ def test_multiple_agents(self, temp_dir):
         emitter.emit(sim_data)
         assert emitter.num_emits == 0
         assert emitter.buffered_emits == {}
+        emitter.finalized = True
 
-    def test_batch_processing(self, temp_dir):
+    def test_batch_processing(self, tmp_path):
         """Test multiple emits and batch processing."""
         # Small batch size for testing
-        emitter = ParquetEmitter({"out_dir": temp_dir, "batch_size": 3})
+        emitter = ParquetEmitter({"out_dir": tmp_path, "batch_size": 3})
 
         # Configuration emit to initialize variables
         config_data = {
@@ -947,6 +944,7 @@ def test_batch_processing(self, temp_dir):
             sim_data["data"]["agents"]["agent1"]["value"] = i * 10
             emitter.emit(sim_data)
             emitter.last_batch_future.result()
+        emitter.finalized = True
 
         # Verify batch was processed
         assert emitter.num_emits == 4
@@ -957,15 +955,9 @@ def test_batch_processing(self, temp_dir):
 
 
 class TestParquetEmitterEdgeCases:
-    @pytest.fixture
-    def temp_dir(self):
-        """Create a temporary directory for testing."""
-        tmp = tempfile.mkdtemp()
-        yield tmp
-        shutil.rmtree(tmp)
 
     @patch("ecoli.library.parquet_emitter.ThreadPoolExecutor")
-    def test_multithreaded_buffer_clearing(self, mock_executor_class, temp_dir):
+    def test_multithreaded_buffer_clearing(self, mock_executor_class, tmp_path):
         """
         Test to verify that clearing buffers after submitting to ThreadPoolExecutor
         doesn't cause race conditions with the worker thread.
@@ -1006,7 +998,7 @@ def delayed_execution():
         mock_executor_class.return_value = mock_executor
 
         # Initialize the emitter with a small batch size
-        emitter = ParquetEmitter({"out_dir": temp_dir, "batch_size": 2})
+        emitter = ParquetEmitter({"out_dir": tmp_path, "batch_size": 2})
         # Configuration emit to initialize variables
         config_data = {
             "table": "configuration",
@@ -1086,16 +1078,17 @@ def delayed_execution():
         # Changed type for field2 to list so should fail
         with pytest.raises(pl.exceptions.InvalidOperationError):
             emitter.finalize()
+        emitter.finalized = True
         # Cleanup the real executor
         real_executor.shutdown()
 
-    def test_variable_shape_detection_at_boundaries(self, temp_dir):
+    def test_variable_shape_detection_at_boundaries(self, tmp_path):
         """
         Test the fixed vs variable shape field detection logic specifically at
         the boundary points (start of sim, after disk write).
         """
         # Use a small batch size to quickly hit the boundary
-        emitter = ParquetEmitter({"out_dir": temp_dir, "batch_size": 3})
+        emitter = ParquetEmitter({"out_dir": tmp_path, "batch_size": 3})
 
         # Setup: Emit configuration data to intitialize variables
         config_data = {
@@ -1198,6 +1191,7 @@ def test_variable_shape_detection_at_boundaries(self, temp_dir):
         emitter.emit(sim_data4)
 
         emitter.last_batch_future.result()
+        emitter.finalized = True
         t = pl.read_parquet(
             os.path.join(
                 emitter.out_uri,
@@ -1224,12 +1218,12 @@ def test_variable_shape_detection_at_boundaries(self, temp_dir):
             [[1], [2], [3], [4], [5]],
         ]
 
-    def test_expected_failures(self, temp_dir):
+    def test_expected_failures(self, tmp_path):
         """
         Test a few cases that are expected to fail.
         """
         # Use a small batch size to quickly hit the boundary
-        emitter = ParquetEmitter({"out_dir": temp_dir, "batch_size": 3})
+        emitter = ParquetEmitter({"out_dir": tmp_path, "batch_size": 3})
 
         # Setup: Emit configuration data to intitialize variables
         config_data = {
@@ -1394,10 +1388,11 @@ def test_expected_failures(self, temp_dir):
             match=re.escape("cannot parse numpy data type dtype('O')"),
         ):
             emitter.emit(sim_data7)
+        emitter.finalized = True
 
-    def test_nested_nullable(self, temp_dir):
+    def test_nested_nullable(self, tmp_path):
         """Test handling nullable nested types that increase in depth."""
-        emitter = ParquetEmitter({"out_dir": temp_dir, "batch_size": 4})
+        emitter = ParquetEmitter({"out_dir": tmp_path, "batch_size": 4})
         # Configuration emit to initialize variables
         config_data = {
             "table": "configuration",
@@ -1518,6 +1513,7 @@ def test_nested_nullable(self, temp_dir):
         for _ in range(3):
             emitter.emit(sim_data1)
             emitter.last_batch_future.result()
+        emitter.finalized = True
 
         # Check output
         t = pl.read_parquet(
diff --git a/ecoli/library/test_utils.py b/ecoli/library/test_utils.py
new file mode 100644
index 000000000..1fbdd390e
--- /dev/null
+++ b/ecoli/library/test_utils.py
@@ -0,0 +1,99 @@
+
+"""
+Utilities for patching execution environments, configurations and functions.
+"""
+
+
+from abc import ABC, abstractmethod
+from collections.abc import Callable
+from functools import reduce
+from inspect import ismethod
+from unittest.mock import Mock, DEFAULT, _patch, patch
+from typing import Any
+
+import pytest
+
+from ecoli.library.xarray_emitter.utils import WarningFilter
+
+
+# ==============================================================================
+# warnings
+# ==============================================================================
+
+
+def filter_warnings(filters: list[WarningFilter]) -> Callable[[Callable], Callable]:
+    """
+    Analogue of :py:func:`ecoli.library.xarray_emitter.utils.filter_warnings`,
+    but with the effect of applying :py:func:`pytest.mark.filterwarnings`
+    decorators, instead of :py:func:`warnings.filterwarnings` context modifiers.
+    """
+    return (lambda func: reduce(
+        lambda fun, wf: pytest.mark.filterwarnings(str(wf))(fun),
+        filters, func))  # one mark per filter, applied in list order
+
+
+
+# ==============================================================================
+# config patching
+# ==============================================================================
+
+
+class PatchConfig(ABC):
+    """
+    Test parameter for modifying an already loaded baseline JSON configuration.
+    """
+
+    @abstractmethod
+    def to_dict(self) -> dict[str, Any]:
+        """
+        Materialise the changes to the JSON configuration as a dictionary.
+        """
+        ...
+
+
+# ==============================================================================
+# code patching
+# ==============================================================================
+
+
+def patch_func(func: str, *, cb: Callable | None = None) -> _patch:
+    """
+    Create a context manager which patches a module-level function, in order to
+    trace its calls, and to optionally pre-apply a callback.
+
+    .. note::
+      ``func`` is passed as the argument ``target`` to
+      :py:func:`unittest.mock.patch`.
+    """
+    mocked = None  # placeholder; rebound to the patcher below
+    def side_effect(*args, **kwargs) -> Any:
+        nonlocal cb, mocked
+        if cb is not None:
+            cb(*args, **kwargs)  # callback sees the call arguments first
+        return mocked.temp_original(*args, **kwargs)  # type: ignore[attr-defined]
+    mocked = patch(func, side_effect=side_effect)
+    return mocked
+
+
+# ------------------------------------------------------------------------------
+
+
+def patch_meth(
+    obj: object, meth: str, *,
+    cb: Callable | None = None, modargs: Callable | None = None
+) -> None:
+    """
+    Patch an object instance method, in order to trace its calls, and to
+    optionally pre-apply a callback or argument modification.
+    """
+    assert ismethod(getattr(obj, meth))
+    assert cb is None or modargs is None  # the two hooks are mutually exclusive
+    def side_effect(*args, **kwargs):
+        nonlocal obj, meth, cb, modargs
+        if modargs is not None:
+            _args, _kwargs = modargs(obj, *args, **kwargs)
+            return getattr(obj, meth)._mock_wraps(*_args, **_kwargs)
+        elif cb is not None:
+            cb(obj, *args, **kwargs)
+        return DEFAULT  # lets the Mock fall through to its `wraps` target
+    setattr(obj, meth, Mock(wraps=getattr(obj, meth), side_effect=side_effect))
diff --git a/ecoli/library/xarray_emitter/__init__.py b/ecoli/library/xarray_emitter/__init__.py
new file mode 100644
index 000000000..6ccb43e76
--- /dev/null
+++ b/ecoli/library/xarray_emitter/__init__.py
@@ -0,0 +1,288 @@
+
+r"""
+
+Introduction
+============
+
+:py:class:`.XarrayEmitter` is an :py:class:`~vivarium.core.emitter.Emitter`
+similar to :py:class:`~.ParquetEmitter`, but with a design optimized towards a
+different flavour of downstream applications:
+
+- :py:class:`~.ParquetEmitter` is geared towards emitting a significant fraction
+  of the simulator state, in a format that supports flexible sparse selections,
+  `data reductions`_ and time series visualizations, as used in :ref:`analysis
+  scripts <analysis_scripts>`.
+- :py:class:`.XarrayEmitter` is intended for emitting only a pre-selected subset
+  of statically shaped tensor variables, in a format that supports numerical
+  algorithms in the high-dimensional and large-sample regime.
+
+The former type of computations is naturally expressed using `relational query`_
+engines (e.g., :ref:`DuckDB <parquet_read>`), whereas the latter type is
+naturally expressed using `array programming`_ libraries (e.g., `Cubed`_). Due
+to the sheer size of the simulator state, both types may in general require
+`out-of-core processing`_ algorithms.
+
+.. _data reductions: https://en.wikipedia.org/wiki/Data_reduction
+.. _relational query: https://en.wikipedia.org/wiki/Relational_database
+.. _array programming: https://en.wikipedia.org/wiki/Array_programming
+.. _Cubed: https://cubed-dev.github.io/cubed/why-cubed.html
+.. _out-of-core processing: https://en.wikipedia.org/wiki/External_memory_algorithm
+
+In order to facilitate downstream applications based on chunked array
+processing, :py:class:`.XarrayEmitter` writes out to any persistent storage
+supporting the `Zarr`_ specification, using an in-memory buffer composed of
+`Xarray`_ objects. For optimized throughput, the buffer implements temporal
+subsampling, numerical type casting and compression codecs at emission time.
+Furthermore, in order to simplify the export of simulation data into external
+libraries, the hierarchy of the output `DataTree`_ is decoupled from the
+hierarchy of simulation :py:class:`~vivarium.core.store.Store`\ s, using an
+output :ref:`variable layout <variable_layout>` specified in the :ref:`simulator
+configuration <sim_config>`.
+
+.. _Xarray: https://xarray.dev/
+.. _Zarr: https://zarr.dev/
+.. _DataTree: https://docs.xarray.dev/en/stable/user-guide/data-structures.html#datatree
+
+
+Comparison with :py:class:`~.ParquetEmitter`
+============================================
+
+Similarities
+------------
+
+- Currently only supports simulations of a *single-cell lineage* per
+  :py:class:`.BufferedEmitter` instance.
+- Executes at every time step.
+- Buffers emissions into time chunks.
+- Uses concurrent threads for writing buffers to persistent storage.
+- Produces a hierarchically structured storage layout that supports selective
+  reading in downstream applications.
+
+Differences in usage
+--------------------
+
+- Supports the configuration of *emission predicates*.
+- Currently only supports emitting a *static collection* of *statically shaped
+  tensor variables*.
+- Supports *renaming and rearranging* of output variables.
+- Requires the configuration of *output data types*.
+- Supports the configuration of backend-specific *compression codecs*.
+- Supports :ref:`log_updates`, i.e., the emission of individual
+  :py:class:`~vivarium.core.process.Process` update requests, before they are
+  aggregated and reallocated by
+  :py:func:`~ecoli.processes.allocator.calculatePartition` and then applied to
+  the global cell state by
+  :py:meth:`~ecoli.processes.partition.PartitionedProcess.evolve_state`.
+
+.. note::
+  See :py:class:`.XarrayEmitter` for an explanation of the JSON configuration
+  syntax, and ``configs/test_configs/test_xarray_emitter.json`` for a complete
+  example.
+
+.. hint::
+  As data structures, `DataTree`_\ s could support changes of variable names and
+  dimensions across time steps. The constraints currently imposed by
+  :py:class:`.XarrayEmitter` rather serve to enable I/O optimizations for the
+  intended use cases. When access to variably sized simulation variables is
+  desired, users have the choice either of implementing custom :ref:`listeners
+  <listeners>` with static output coordinates, or otherwise of defaulting to the
+  :py:class:`~.ParquetEmitter`.
+
+Differences in implementation
+-----------------------------
+
+- Uses the `Xarray`_ API for serialization, buffering, and `metadata
+  organization`_, including unit annotations (see :py:class:`.VariableSpec` and
+  :py:class:`.XarrayTransducer` for details).
+- Applies a "*process*-major" rather than a "*generation*-major" output layout,
+  reflecting array variables directly in the output directory tree; this
+  produces one file per *variable* time chunk, rather than one file per
+  *simulation* time chunk (compare the :py:class:`.XarrayEmitter` :ref:`storage
+  layout <storage_layout>` with :py:meth:`.ParquetEmitter.emit`; see
+  :py:class:`.XarrayStoragePartition` for details).
+- Defines the abstract interface :py:class:`.AsyncBufferWriter` for storage
+  backends with *asynchronous* APIs (currently supported: `Zarr`_), realizing
+  the opportunity for :ref:`concurrency <concurrency>` among multiple
+  `DataArray`_\ s within an output buffer.
+- Decouples the in-memory buffer size from the persistent chunk size, in order
+  to simplify performance tuning of large-scale simulations (see
+  :py:class:`.XarrayTransducer` and :py:class:`.AsyncBufferWriter` for details).
+- Maintains `consolidated metadata`_ and updates it at the end of each simulated
+  cell generation, in order to reduce the metadata loading latency for
+  subsequent storage reads (see :py:class:`.AsyncZarrBufferWriter` for details).
+
+.. _metadata organization: https://docs.xarray.dev/en/stable/get-help/faq.html#approach-to-metadata
+.. _DataArray: https://docs.xarray.dev/en/stable/user-guide/data-structures.html#dataarray
+.. _consolidated metadata: https://docs.xarray.dev/en/stable/user-guide/io.html#io-zarr-consolidated-metadata
+
+
+.. _storage_layout:
+
+Storage layout
+==============
+
+The workflow storage layout, which comprises many individual simulations, is
+currently organized as follows --- where file paths in this example are specific
+to the Zarr v3 storage backend::
+
+  {store}                                         ;  <root>
+  ├─ zarr.json                                    ;    metadata
+  └─ experiment_id={}/variant={}/lineage_seed={}  ;    <independent substore>
+     ├─ zarr.json                                 ;      consolidated metadata
+     ├─ emitstep_gen={}                           ;      <time coordinate>
+     │  ├─ zarr.json                              ;        metadata
+     │  └─ c/...                                  ;        chunked array
+     ├─ time_gen={}                               ;      <time values>
+     │  ├─ zarr.json                              ;        metadata
+     │  └─ c/...                                  ;        chunked array
+     └─ {path/to/variable}                        ;      <variable layout>
+        ├─ zarr.json                              ;        metadata
+        ├─ id_{variable}                          ;        <variable coordinate>
+        │  ├─ zarr.json                           ;          metadata
+        │  └─ c/...                               ;          chunked array
+        └─ generation={}                          ;        <variable values>
+           ├─ zarr.json                           ;          metadata
+           └─ c/...                               ;          chunked array
+
+This design is motivated by the following considerations:
+
+  - Using relative paths inside a global store simplifies the authentication,
+    configuration and resource management of file system providers during highly
+    parallel, long-running simulation workflows.
+  - An :py:attr:`.XarrayStoragePartition.independent_path` locates a logically
+    self-contained substore, which maintains its own `consolidated metadata`_
+    without communicating to other substores.
+  - Fine-grained control over storage footprint, variable selection, latency and
+    throughput, both during emission and during post-processing, is enabled by
+    distinguishing *at the file system level* among simulation variables, as
+    well as between metadata, coordinate data and variable data. In particular:
+
+    - Chunk sizes and compression codecs can be configured for each variable.
+    - By leveraging `inheritance`_ inside an independent substore, each
+      generation's time coordinate is shared across the generation's variables,
+      and each variable coordinate is shared across all generations.
+
+.. note::
+  In order to fully benefit from consolidated metadata, downstream applications
+  should open independent substores directly, i.e., based on their known
+  relative file system paths, rather than by first loading all metadata for the
+  global store. This can be achieved, e.g., by calling
+  :py:func:`xarray.open_datatree` only on substores, or by using lower-level
+  APIs such as :py:func:`zarr.open_group`.
+
+  An alternative would be to perform metadata consolidation on the global store
+  at the end of an entire workflow, e.g., by calling
+  :py:func:`zarr.consolidate_metadata` for the Zarr storage backend. However,
+  this may be an expensive operation accessing a large number of files, and
+  would, for the `zarr-python`_ implementation at the time of writing, ignore
+  the already incrementally consolidated metadata in independent substores.
+
+.. _inheritance: https://docs.xarray.dev/en/stable/user-guide/hierarchical-data.html#alignment-and-coordinate-inheritance
+.. _zarr-python: https://github.com/zarr-developers/zarr-python
+
+
+.. _variable_layout:
+
+Variable layout
+===============
+
+For each individual :py:class:`.EcoliSim` simulation, the mapping from the
+Vivarium simulation hierarchy (:py:class:`~vivarium.core.store.Store`) to the
+Xarray output hierarchy (:py:class:`~xarray.DataTree`) is configured using three
+levels of grouping::
+
+  ForestView      ;  specifies a full `xarray.DataTree`
+  └─ TreeView     ;  specifies a partial `xarray.DataTree`
+     └─ LeafView  ;  specifies a single `xarray.DataArray`
+
+A :py:class:`.LeafView` corresponds to a single array variable emitted by
+Vivarium, a :py:class:`.TreeView` collects :py:class:`.LeafView`\ s whose
+metadata paths share a common root, and a :py:class:`.ForestView` is a group of
+:py:class:`.TreeView`\ s within a single ``agent_id`` (see :ref:`Configuration
+<sim_config>`).
+
+
+Software architecture
+=====================
+
+:py:class:`.XarrayEmitter` is in essence a `finite-state transducer`_, and its
+state factors through the following object ownership relations::
+
+  .XarrayEmitter(BufferedEmitter)                     ;  <application layer>
+  ├─ .XarrayTransducer                                ;    <presentation layer>
+  │  ├─ .ConjunctiveEmitPredicate                     ;      emission criterion
+  │  └─ .XarrayBuffer                                 ;      output buffer
+  │     ├─ .ForestView                                ;        variable layout
+  │     ├─ xarray.DataTree                            ;        memory layout
+  │     └─ .XarrayStoragePartition(StoragePartition)  ;        storage layout
+  └─ .AsyncZarrBufferWriter(AsyncBufferWriter)        ;    <session layer>
+     └─ xarray.backends.ZarrStore                     ;      <transport layer>
+        └─ zarr.Group                                 ;        persistent storage
+
+.. _finite-state transducer: https://en.wikipedia.org/wiki/Finite-state_transducer
+
+
+.. _concurrency:
+
+Concurrency
+===========
+
+The current design employs two levels of concurrency per :py:class:`~.EcoliSim`
+OS process::
+
+  [main thread]       ;  XarrayEmitter.flush()
+  └─ [writer thread]  ;  AsyncBufferWriter._write()
+     └─ [coroutine]   ;  AsyncArrayWriter._async()
+
+Each time the :py:class:`.XarrayBuffer` is filled up, the writer thread receives
+a :py:meth:`~concurrent.futures.Executor.submit` call from the main thread (see
+:py:meth:`.AsyncBufferWriter.write`). In turn, the writer thread executes a
+`coroutine`_ that leverages a backend-specific API for asynchronously executing
+the low-level write operations required for persisting the buffer contents (see
+:py:class:`.AsyncArrayWriter`).
+
+.. _coroutine: https://docs.python.org/3/howto/a-conceptual-overview-of-asyncio.html
+
+This design is motivated by the following observations at the time of writing:
+
+  - In the typical use case of :py:class:`.XarrayEmitter`,
+    :math:`10^2`--:math:`10^5`
+    :py:class:`~ecoli.experiments.ecoli_master_sim.EcoliSim` instances are
+    executed in parallel, on a single core each.
+  - The multiplicity of *bandwidth*-consuming arrays in each
+    :py:class:`.XarrayBuffer` provides an opportunity for concurrency, even
+    though on typical compute environments, the *latency* of the transport layer
+    in the :py:class:`.AsyncBufferWriter` is assumed to be at least 3 orders of
+    magnitude smaller than the simulation time required to fill an
+    :py:class:`.XarrayBuffer`. This is particularly relevant if many parallel
+    simulations in an HPC environment are flushing their buffers at correlated
+    wall-clock times.
+  - Since using many threads per
+    :py:class:`~ecoli.experiments.ecoli_master_sim.EcoliSim` OS process would
+    slow down the simulation, and since using many concurrent connections per
+    :py:class:`~ecoli.experiments.ecoli_master_sim.EcoliSim` OS process would
+    congest the transport layer, the optimal choice is expected to be a small
+    integer for both resource parameters.
+  - The :py:mod:`~zarr.api.asynchronous` API was `central to the design`_ of
+    `zarr-python`_ 3.
+  - In Xarray, library support for ``async`` calls to storage backends is `still
+    in flux`_. In particular, :py:class:`xarray.backends.ZarrStore` does not yet
+    fully reflect Zarr's ``async`` API, with current support for asynchronous
+    writing `tied`_ to a `chunked array library`_ via
+    :py:class:`xarray.namedarray.parallelcompat.ChunkManagerEntrypoint`,
+    including in a recent `proof-of-concept`_.
+
+.. hint::
+  - The numbers of threads and concurrent connections in the transport layer
+    have backend-specific configuration options (see
+    :py:class:`~.zarr_writer.AsyncZarrBufferWriter`).
+  - Threading in the session layer can be disabled for debugging purposes (see
+    :py:class:`.AsyncBufferWriter`).
+
+.. _central to the design: https://zarr.readthedocs.io/en/v3.0.8/developers/roadmap.html#async-api
+.. _still in flux: https://github.com/pydata/xarray/issues/10622
+.. _tied: https://github.com/pydata/xarray/pull/10625
+.. _chunked array library: https://docs.xarray.dev/en/stable/internals/chunked-arrays.html
+.. _proof-of-concept: https://github.com/pydata/xarray/pull/11171
+
+"""
diff --git a/ecoli/library/xarray_emitter/emit_path.py b/ecoli/library/xarray_emitter/emit_path.py
new file mode 100644
index 000000000..7718d7b11
--- /dev/null
+++ b/ecoli/library/xarray_emitter/emit_path.py
@@ -0,0 +1,136 @@
+
+"""
+Structural assumptions made by :py:class:`.XarrayBuffer` about schema paths of
+emitted variables.
+
+.. note::
+  Adding support for a new metadata provider or a new kind of
+  non-:py:class:`~vivarium.core.store.Store` emit path will involve extending
+  :py:class:`.EmitPath` and :py:class:`.TreeView`.
+"""
+
+
+from __future__ import annotations
+
+from dataclasses import dataclass, field
+from enum import Flag, auto
+
+from vivarium.core.types import HierarchyPath
+
+
+# ==============================================================================
+# emit paths
+# ==============================================================================
+
+
+class EmitPathType(Flag):
+    r"""
+    Combinable flags describing :py:data:`~vivarium.core.types.HierarchyPath`\ s;
+    they are computed in the constructor of :py:class:`.EmitPath`.
+    """
+
+    agent = auto()
+    """
+    Absolute path prefix until ``agent_id``. Other paths wrapped by
+    :py:class:`.EmitPath` are relative to an agent.
+    """
+    listener = auto()
+    """
+    Relative path to a ``("listeners", ...)``
+    :py:class:`~vivarium.core.store.Store` created by
+    :py:func:`~ecoli.library.schema.listener_schema`.
+    """
+    update = auto()
+    r"""
+    Relative path to a ``("log_update", ...)``
+    :py:class:`~vivarium.core.store.Store` created by
+    :py:func:`~ecoli.library.logging_tools.make_logging_process`. The output
+    tree from such a store does not map onto a source tree of
+    :py:class:`~vivarium.core.store.Store`\ s, and hence does not support
+    internal ``emit`` flags.
+    """
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @property
+    def is_agent(self) -> bool:
+        return EmitPathType.agent in self
+
+    @property
+    def is_listener(self) -> bool:
+        return EmitPathType.listener in self
+
+    @property
+    def is_update(self) -> bool:
+        return EmitPathType.update in self
+
+    @property
+    def is_update_listener(self) -> bool:
+        return self.is_listener and self.is_update
+
+
+# ------------------------------------------------------------------------------
+
+
+@dataclass
+class EmitPath:
+    """
+    Data class wrapping an absolute or relative
+    :py:data:`~vivarium.core.types.HierarchyPath` that locates a variable
+    emitted by :py:meth:`!vivarium.core.engine.Engine._emit_store_data`. Such a
+    path consists of:
+
+      1. *always* a path to a :py:class:`~vivarium.core.store.Store`,
+      2. and *possibly* a suffix path inside a schema dictionary that is emitted
+         from (1).
+    """
+
+    type: EmitPathType = field(init=False)
+    path: HierarchyPath
+
+    def __post_init__(self) -> None:
+        assert all(isinstance(p, str) for p in self.path)
+        self.path = parts = tuple(self.path)
+        kind = EmitPathType(0)
+        if "agents" in parts:
+            assert parts[0] == "agents"
+            assert parts.count("agents") == 1
+            kind |= EmitPathType.agent
+        if "listeners" in parts:
+            kind |= EmitPathType.listener
+        if "log_update" in parts:
+            assert parts[0] == "log_update"
+            assert parts.count("log_update") == 1
+            kind |= EmitPathType.update
+        assert not (kind.is_agent and (kind.is_listener or kind.is_update))
+        self.type = kind
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @property
+    def emitting_path(self) -> HierarchyPath:
+        """
+        Path to the responsible :py:class:`~vivarium.core.store.Store`. This is
+        always a prefix of :py:attr:`.path`, and identical to :py:attr:`.path`
+        if :py:attr:`.path` points to a :py:class:`~vivarium.core.store.Store`.
+        """
+        assert not self.type.is_agent
+        if not self.type.is_update_listener:
+            return self.path
+        # cut at the first "listeners" component
+        return self.path[:self.path.index("listeners")]
+
+    @property
+    def metadata_path(self) -> HierarchyPath:
+        """
+        Corresponding path within the result of
+        :py:meth:`ecoli.experiments.ecoli_master_sim.EcoliSim.output_metadata`.
+        """
+        if not self.type.is_update_listener:
+            # access process metadata
+            return ()
+        if self.type.is_listener:
+            # access listener metadata
+            return ("listeners",)
+        # NOTE(review): unreachable while `is_update_listener` implies `is_listener`
+        raise NotImplementedError(f"Metadata access for:\n  {self}")
diff --git a/ecoli/library/xarray_emitter/emit_predicate.py b/ecoli/library/xarray_emitter/emit_predicate.py
new file mode 100644
index 000000000..560db392a
--- /dev/null
+++ b/ecoli/library/xarray_emitter/emit_predicate.py
@@ -0,0 +1,225 @@
+
+"""
+Predicates used by :py:class:`.XarrayTransducer` to decide which *simulation
+steps* will produce *emit steps*. Predicates are represented as formulas in
+`conjunctive normal form`_ (CNF), where literals are atomic predicates
+parametrized by the JSON configuration.
+
+.. _conjunctive normal form: https://en.wikipedia.org/wiki/Conjunctive_normal_form
+"""
+
+
+from __future__ import annotations
+
+from abc import ABC, abstractmethod
+from dataclasses import dataclass, field
+from typing import Any, Self, final
+
+from .utils import emitter_arg_error
+
+
+# ==============================================================================
+# abstract atomic predicate
+# ==============================================================================
+
+
+class AtomicEmitPredicate(ABC):
+    """
+    Base class for atomic predicates over simulation steps; each subtype is
+    parametrized by a JSON configuration.
+
+    Example JSON configuration::
+
+      {"subsample": {"interval": 10}}
+
+    Here, the single top-level key determines the predicate subtype, and the
+    single top-level value constitutes its parameters.
+    """
+
+    @classmethod
+    def build(cls, config: dict[str, Any]) -> AtomicEmitPredicate:
+        """
+        Instantiate the concrete subclass selected by ``config``.
+
+        Raises:
+          TypeError: If ``config`` is not a single-entry dictionary, or if its
+            key does not name a supported predicate type.
+        """
+        if not (isinstance(config, dict) and len(config) == 1):
+            raise TypeError(emitter_arg_error(
+                cls, "Invalid argument", f"\"predicate\": [[{config}]]"))
+        (kind, params), = config.items()
+        if kind == "fixed":
+            return FixedSteps(**params)
+        if kind == "subsample":
+            return SubsampleSteps(**params)
+        raise TypeError(emitter_arg_error(
+            cls, "Unsupported predicate type",
+            f"\"predicate\": [[{config}]]"))
+
+    @abstractmethod
+    def __call__(self, sim_tix: int, t: float, data: dict[str, Any], /) -> bool:
+        """
+        Evaluate the predicate for a simulation step.
+
+        Args:
+          sim_tix: :py:attr:`.XarrayTransducer.sim_tix`.
+          t:       Simulation time stamp.
+          data:    Input received from :py:meth:`!Engine._emit_store_data`.
+        """
+        ...
+
+
+# ==============================================================================
+# composite predicates
+# ==============================================================================
+
+
+@dataclass(slots=True, frozen=True)
+class DisjunctiveEmitPredicate:
+    """
+    A disjunctive clause whose literals are atomic predicates.
+
+    Example JSON configuration::
+
+      [...]
+
+    Here, each entry in the JSON array is parsed by
+    :py:class:`.AtomicEmitPredicate`.
+    """
+
+    atoms: list[AtomicEmitPredicate]
+
+    def __post_init__(self) -> None:
+        assert isinstance(self.atoms, list)
+        assert all(isinstance(p, AtomicEmitPredicate) for p in self.atoms)
+
+    @classmethod
+    def build(cls, config: list[dict[str, Any]]) -> Self:
+        if not isinstance(config, list):
+            raise TypeError(emitter_arg_error(
+                cls, "Invalid argument", f"\"predicate\": [{config}]"))
+        return cls(list(map(AtomicEmitPredicate.build, config)))
+
+    def __call__(self, sim_tix: int, t: float, data: dict[str, Any], /) -> bool:
+        """
+        Evaluate the clause for a simulation step: ``True`` iff at least one
+        atom holds (hence ``False`` for an empty clause).
+
+        Calls: :py:meth:`.AtomicEmitPredicate.__call__`.
+
+        Args:
+          sim_tix: :py:attr:`.XarrayTransducer.sim_tix`.
+          t:       Simulation time stamp.
+          data:    Input received from :py:meth:`!Engine._emit_store_data`.
+        """
+        return any(p(sim_tix, t, data) for p in self.atoms)
+
+
+# ------------------------------------------------------------------------------
+
+
+@dataclass(slots=True, frozen=True)
+class ConjunctiveEmitPredicate:
+    """
+    A conjunctive formula over disjunctive clauses.
+
+    Example JSON configuration::
+
+      [...]
+
+    Here, each entry in the JSON array is parsed by
+    :py:class:`.DisjunctiveEmitPredicate`.
+    """
+
+    clauses: list[DisjunctiveEmitPredicate]
+
+    def __post_init__(self) -> None:
+        assert isinstance(self.clauses, list)
+        assert all(isinstance(c, DisjunctiveEmitPredicate) for c in self.clauses)
+
+    @classmethod
+    def build(cls, config: list[list[dict[str, Any]]]) -> Self:
+        if not isinstance(config, list):
+            raise TypeError(emitter_arg_error(
+                cls, "Invalid argument", f"\"predicate\": {config}"))
+        return cls(list(map(DisjunctiveEmitPredicate.build, config)))
+
+    def __call__(self, sim_tix: int, t: float, data: dict[str, Any], /) -> bool:
+        """
+        Evaluate the formula for a simulation step: ``True`` iff every clause
+        holds (hence ``True`` for an empty formula).
+
+        Calls: :py:meth:`.DisjunctiveEmitPredicate.__call__`.
+
+        Args:
+          sim_tix: :py:attr:`.XarrayTransducer.sim_tix`.
+          t:       Simulation time stamp.
+          data:    Input received from :py:meth:`!Engine._emit_store_data`.
+        """
+        return all(c(sim_tix, t, data) for c in self.clauses)
+
+
+# ==============================================================================
+# concrete predicates
+# ==============================================================================
+
+
+@final
+@dataclass(kw_only=True, slots=True)
+class FixedSteps(AtomicEmitPredicate):
+    """
+    An atomic predicate which selects a statically known set of simulation
+    steps. Evaluation is stateless, so steps at which a surrounding clause or
+    formula short-circuits past this atom do not affect later matches.
+
+    Example JSON configuration::
+
+      {"fixed": {"steps": [0]}}
+
+    Here, ``steps`` is a list of integer-valued simulation steps.
+    """
+
+    steps: list[int]
+    _selected: frozenset[int] = field(init=False, repr=False, compare=False)
+
+    def __post_init__(self) -> None:
+        match self.steps:
+            case list(steps) if all(isinstance(s, int) and s >= 0 for s in steps):
+                self._selected = frozenset(steps)
+                self.steps = sorted(self._selected)
+            case steps:
+                raise ValueError(emitter_arg_error(
+                    self, "Invalid argument",
+                    f"\"predicate\": [[{{\"fixed\": {{\"steps\": {steps}}}}}]]"))
+
+    def __call__(self, sim_tix: int, t: float, data: dict[str, Any], /) -> bool:
+        # pure membership test: no state is consumed between calls
+        return sim_tix in self._selected
+
+@final
+@dataclass(kw_only=True, slots=True, frozen=True)
+class SubsampleSteps(AtomicEmitPredicate):
+    """
+    An atomic predicate which selects every ``interval``-th simulation step.
+
+    Example JSON configuration::
+
+      {"subsample": {"interval": 10}}
+
+    Here, ``interval`` is an integer number of simulation steps.
+    """
+
+    interval: int
+
+    def __post_init__(self) -> None:
+        i = self.interval
+        if isinstance(i, int) and i >= 1:
+            return
+        # anything but a positive integer is a configuration error
+        raise ValueError(emitter_arg_error(
+            self, "Invalid argument",
+            f"\"predicate\": [[{{\"subsample\": {{\"interval\": {i}}}}}]]"))
+
+    def __call__(self, sim_tix: int, t: float, data: dict[str, Any], /) -> bool:
+        return (sim_tix % self.interval) == 0
diff --git a/ecoli/library/xarray_emitter/emitter.py b/ecoli/library/xarray_emitter/emitter.py
new file mode 100644
index 000000000..0f8f1c8a0
--- /dev/null
+++ b/ecoli/library/xarray_emitter/emitter.py
@@ -0,0 +1,233 @@
+
+"""
+See :py:mod:`.xarray_emitter`.
+"""
+
+
+from __future__ import annotations
+
+from datetime import datetime
+from pathlib import Path
+from pprint import pp
+from typing import Any, final
+
+from vivarium.core.types import HierarchyPath
+from vivarium.core.engine import Engine
+from vivarium.core.store import Store
+
+from ..emitter import BufferedEmitter
+from .transducer import XarrayTransducer
+from .storage import XarrayStoragePartition
+from .writer import AsyncBufferWriter
+from .utils import emitter_arg_error
+
+
+# ==============================================================================
+
+
+@final
+class XarrayEmitter(BufferedEmitter):
+    """
+    Entry point for :py:mod:`.xarray_emitter`.
+
+    This is a wrapper around :py:class:`.XarrayTransducer`, and is mainly
+    responsible for:
+
+      - Propagating configurations.
+      - Coupling to :py:class:`~vivarium.core.engine.Engine` via the
+        :py:class:`.BufferedEmitter` interface.
+      - Connecting :py:class:`.XarrayTransducer` to
+        :py:class:`.AsyncBufferWriter`.
+
+    Example JSON configuration::
+
+      {
+        "emitter": "xarray",
+        "emitter_arg": {
+          "transducer": {...},
+          "view": [...],
+          "writer": {...}
+        }
+      }
+
+    Here,
+
+      - ``transducer`` is parsed by :py:class:`.XarrayTransducer`,
+      - ``view`` is parsed by :py:class:`.ForestView`,
+      - and ``writer`` is parsed by :py:class:`.AsyncBufferWriter`.
+
+    For a complete example, see
+    ``configs/test_configs/test_xarray_emitter.json``.
+    """
+
+    __slots__ = ("transducer", "writer", "finalized", "debug")
+
+    metadata_keys = [
+        'experiment_id', 'description', 'sim_data_path', 'time',
+        'suffix_time', 'time_step', 'initial_global_time',
+        'max_duration', 'fail_at_max_duration',
+        'lineage_seed', 'seed', 'variants', 'n_init_sims', 'generations',
+        'agent_id', 'parallel',
+        'skip_baseline', 'log_updates',
+        'single_daughters', 'daughter_outdir',
+        'fixed_media', 'condition',
+        'parca_options',
+        'mar_regulon', 'amp_lysis',
+        'divide', 'd_period', 'division_threshold', 'division_variable',
+        'chromosome_path',
+    ]
+    """
+    The subset of metadata selected by :py:meth:`.extract_metadata`.
+    """
+
+    def __init__(self, config: dict[str, Any], /) -> None:
+        self.validate_config(config)  # fail fast, before building any layer
+        self.debug: bool = config.get("debug", False)
+        """ Flag for debug-level printing. Defaults to ``False``. """
+        self.transducer: XarrayTransducer = XarrayTransducer(config, debug=self.debug)
+        """ Presentation layer. """
+        self.writer: AsyncBufferWriter = AsyncBufferWriter.dispatch(config["writer"])
+        """ Session layer. """
+        super().__init__()  # base-class setup runs only after both layers exist
+
+    @classmethod
+    def validate_config(cls, config: dict[str, Any], /) -> None:
+        """
+        Verify that all required sections are present (else :py:exc:`KeyError`)
+        and that ``debug``, if given, is a boolean (else :py:exc:`TypeError`).
+        """
+        required = ("transducer", "view", "writer")
+        missing = next((k for k in required if k not in config), None)
+        if missing is not None:
+            raise KeyError(emitter_arg_error(
+                cls, "Missing argument", f"\"{missing}\": ..."))
+        debug = config.get("debug", False)
+        if not isinstance(debug, bool):
+            raise TypeError(emitter_arg_error(
+                cls, "Invalid argument", f"\"debug\": {debug}"))
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @classmethod
+    def validate_metadata(cls, metadata: dict[str, Any], /) -> None:
+        """
+        Reject simulator configurations that this emitter does not support:
+        each listed option must be truthy or falsy as required below.
+        """
+        must_be_on = ("single_daughters",)
+        must_be_off = (
+            "save", "save_times",
+            "emit_config", "emit_topology", "emit_processes", "emit_unique",
+        )
+        required = [(k, True) for k in must_be_on]
+        required += [(k, False) for k in must_be_off]
+        for key, wanted in required:
+            actual = metadata[key]
+            if bool(actual) is not wanted:
+                raise ValueError(
+                    f"\n  Config argument unsupported by {cls.__name__}:"
+                    f"\n    {{\"{key}\": {actual}}}")
+
+    def extract_partition(self, metadata: dict[str, Any], /) -> XarrayStoragePartition:
+        return XarrayStoragePartition.cast(super().extract_partition(metadata))  # NOTE(review): `cast` presumably narrows the base-class result; confirm
+
+    def extract_metadata(self, metadata: dict[str, Any], /) -> dict[str, Any]:
+        """
+        Select the entries named by :py:attr:`.metadata_keys` from the
+        :py:attr:`!Engine.metadata` populated by :py:meth:`.EcoliSim.run`, and
+        reduce them to basic JSON types (paths and timestamps become strings).
+        This runs while :py:meth:`!Engine._emit_configuration` executes during
+        :py:meth:`!Engine.__init__`; in debug mode the result is also printed.
+        """
+        selected: dict[str, Any] = {}
+        for key in self.metadata_keys:
+            value = metadata[key]
+            if isinstance(value, Path):
+                value = str(value)
+            elif isinstance(value, datetime):
+                # store the timestamp created by `EcoliSim.get_metadata()`,
+                # rather than the one created by `Engine.__init__()`
+                value = str(value.astimezone())
+            selected[key] = value
+        if self.debug:
+            rule = "-" * 79
+            print(f"\nMetadata:\n{rule}")
+            pp(selected)
+            print(rule)
+        return selected
+
+    @staticmethod
+    def extract_coords(metadata: dict[str, Any], /) -> dict[str, Any]:
+        """
+        While executing :py:meth:`!Engine._emit_configuration` during
+        :py:meth:`!Engine.__init__`, extract the port schemas that have been
+        populated by :py:meth:`.EcoliSim.output_metadata`.
+        """
+        return metadata["output_metadata"]
+
+    @property
+    def partition(self) -> XarrayStoragePartition:
+        """
+        Reference to :py:attr:`.XarrayBuffer.partition`.
+        """
+        return self.transducer.buffer.partition
+
+    def flush(self, *, final=False) -> None:
+        """
+        Calls: :py:meth:`.AsyncBufferWriter.write`.
+        """
+        self.writer.write(self.transducer, final=final)
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    def reset_emit_flags(
+        self, *,
+        engine: Engine, agent: HierarchyPath, emit_paths: tuple[HierarchyPath]
+    ) -> None:
+        """
+        In this subclass, ``agent`` is required and ``emit_paths`` is expected
+        to be empty.
+        """
+        assert engine.emitter is self
+        if emit_paths:
+            raise KeyError(
+                "For {\"emitter\": \"xarray\"}, please provide:\n"
+                "  {\"emitter_arg\": {\"view\": ...}}\n"
+                "  instead of\n"
+                "  {\"emit_paths\": ...}")
+        engine.state.set_emit_value(emit=False, path=tuple())
+        agent_state = engine.state.get_path(agent)  # outside `assert` for `-O`
+        assert isinstance(agent_state, Store)
+        agent_state.set_emit_values(
+            emit=True, paths=self.transducer.buffer.view.emitting_paths)
+
+    def emit(self, data: dict[str, Any], /):
+        """
+        Main method.
+
+        Calls: :py:meth:`.XarrayTransducer.step` and possibly :py:meth:`.flush`.
+        """
+        header, payload = data["table"], data["data"]
+        match header:
+            case "configuration":  # sender: `Engine._emit_configuration()`
+                self.validate_metadata(metadata := payload["metadata"])
+                self.transducer.alloc(
+                    partition=self.extract_partition(metadata),
+                    metadata=self.extract_metadata(metadata),
+                    coords=self.extract_coords(metadata))
+                self.writer.open_store(self.transducer.buffer)
+            case "history":  # sender: `Engine._emit_store_data()`
+                if not self.transducer.step(payload):
+                    self.flush()
+                    self.transducer.shift()
+                    # not inside `assert`: the retry must also run under `-O`
+                    if not self.transducer.step(payload):
+                        raise AssertionError("step rejected after shift")
+            case _:
+                raise ValueError(f"Unexpected emit type: {header}")
+
+    def _finalize(self, *, success: bool) -> None:
+        self.flush(final=True)
+        if success:
+            self.writer.mark_success()
+        self.writer.close()
diff --git a/ecoli/library/xarray_emitter/storage.py b/ecoli/library/xarray_emitter/storage.py
new file mode 100644
index 000000000..c20c6447e
--- /dev/null
+++ b/ecoli/library/xarray_emitter/storage.py
@@ -0,0 +1,369 @@
+
+"""
+Constants and parameters defining the output :ref:`storage <storage_layout>` and
+:ref:`variable <variable_layout>` layouts.
+"""
+
+
+from __future__ import annotations
+
+from dataclasses import dataclass, field, fields
+from functools import cached_property
+from pathlib import Path
+from typing import Any, Self, TYPE_CHECKING
+
+import numpy as np
+from xarray import Dataset
+from xarray.core.datatree import NodePath
+
+from ..emitter import StoragePartition
+
+if TYPE_CHECKING:
+    from .writer import AsyncBufferWriter
+
+
+# ==============================================================================
+# constants
+# ==============================================================================
+
+
+TIME_COO_PREFIX = "emitstep_"
+""" Prefix for :py:attr:`.XarrayStoragePartition.time_coo_name`. """
+TIME_VAR_PREFIX = "time_"
+""" Prefix for :py:attr:`.XarrayStoragePartition.time_var_name`. """
+VAR_COO_PREFIX = "id_"
+""" Prefix for :py:attr:`.VariableSpec.var_coo_name`. """
+LOG_ATTR_PREFIX = "last_write_"
+""" Prefix for :py:attr:`.XarrayStoragePartition.log_attr_name`. """
+SUCCESS_ATTR_PREFIX = "division_reached_"
+""" Prefix for :py:attr:`.XarrayStoragePartition.success_attr_name`. """
+
+TIME_COO_DTYPE = np.dtype(np.uint32)
+""" Data type for :py:attr:`.XarrayStoragePartition.time_coo_name`. """
+TIME_VAR_DTYPE = np.dtype(np.float32)
+""" Data type for :py:attr:`.XarrayStoragePartition.time_var_name`. """
+
+
+# ==============================================================================
+# Xarray storage layout
+# ==============================================================================
+
+
+@dataclass(eq=True, kw_only=True)
+class XarrayStoragePartition(StoragePartition):
+    """
+    Relative storage paths and coordinate names used by
+    :py:class:`.XarrayEmitter` to place the output from a single-generation
+    :py:class:`.EcoliSim` within a workflow store.
+
+    See :ref:`storage_layout` for the design rationale.
+    """
+
+    @classmethod
+    def cast(cls, partition: StoragePartition) -> Self:
+        assert isinstance(partition, StoragePartition)
+        return cls(**{f.name: getattr(partition, f.name)
+                      for f in fields(partition) if f.init})
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @cached_property
+    def independent_path(self) -> Path:
+        """
+        The most specific location within a workflow store that has the
+        following properties:
+
+        - It holds a *stochastically independent* simulation subensemble.
+        - It is *representationally independent*.
+
+        A simulation subensemble is considered *stochastically independent* if
+        no numerical values from other subensembles are involved in its
+        simulation; Note that this concern is separate from the choices of
+        software versions and parameters, which are coupled at the project
+        level. A substorage is *representationally independent* if it is
+        self-contained in terms of semantic coordinate annotations, and if it
+        does not rely on any external synchronisation mechanism for maintaining
+        the consistency of its storage layout metadata.
+        """
+        return Path(*(f"{k}={getattr(self, k)}" for k in
+                      ["experiment_id", "variant", "lineage_seed"]))
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @cached_property
+    def dynamic_suffix(self) -> str:
+        """
+        Uniquely identifying suffix path for variables which occur in multiple
+        realisations within an independent substore.
+        """
+        return str(NodePath(*(f"{k}={getattr(self, k)}" for k in
+                              ["generation"])))
+
+    @cached_property
+    def sim_id(self) -> str:
+        """
+        Suffix used in :py:attr:`.time_coo_name`. This information is logically
+        equivalent to :py:attr:`.dynamic_suffix`.
+        """
+        return f"gen={self.generation}"
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @cached_property
+    def time_coo_name(self) -> str:
+        r"""
+        Name of the integer-valued `Xarray dimension coordinate`_ for the
+        current simulation that is located in the root node of the output
+        :py:class:`~xarray.DataTree`. All emitted `Xarray data variable`_\ s
+        inherit this dimension coordinate, including :py:attr:`.time_var_name`.
+
+        .. _Xarray data variable: https://docs.xarray.dev/en/stable/user-guide/terminology.html#term-Variable
+        .. _Xarray dimension coordinate: https://docs.xarray.dev/en/stable/user-guide/terminology.html#term-Dimension-coordinate
+        """
+        return f"{TIME_COO_PREFIX}{self.sim_id}"
+
+    @cached_property
+    def time_var_name(self) -> str:
+        """
+        Name of the real-valued `Xarray data variable`_ holding simulation timestamps.
+        """
+        return f"{TIME_VAR_PREFIX}{self.sim_id}"
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @cached_property
+    def log_attr_name(self) -> str:
+        """
+        Attribute name used by :py:meth:`.AsyncBufferWriter.log_effect`.
+        """
+        return f"{LOG_ATTR_PREFIX}{self.sim_id}"
+
+    @cached_property
+    def success_attr_name(self) -> str:
+        """
+        Attribute name used by :py:meth:`.AsyncBufferWriter.mark_success`.
+        """
+        return f"{SUCCESS_ATTR_PREFIX}{self.sim_id}"
+
+
+# ==============================================================================
+# Xarray output variable
+# ==============================================================================
+
+
+type VariableEncoding = dict[str, Any]
+
+
+# ==============================================================================
+
+
+@dataclass(kw_only=True, slots=True, frozen=True)
+class VariableSpec:
+    """
+    Complete configuration of an output variable for :py:class:`.XarrayEmitter`,
+    including:
+
+    - its name, data type and metadata,
+    - its coordinate data,
+    - its allocation inside :py:class:`.XarrayBuffer`,
+    - and its encoding for :py:class:`.AsyncBufferWriter`.
+
+    This object is created by :py:meth:`.XarrayBuffer.assemble` from a
+    :py:class:`.LeafView` and dynamic metadata.
+
+    .. note::
+      In accordance with `Xarray's view of the Zarr format`_, annotations are
+      placed in :py:attr:`xarray.Dataset.attrs` rather than in
+      :py:attr:`xarray.DataArray.attrs`.
+
+    .. _Xarray's view of the Zarr format: https://docs.xarray.dev/en/stable/internals/zarr-encoding-spec.html
+    """
+
+    #: Simulation metadata.
+    partition: XarrayStoragePartition
+    #: Variable name, determining the output paths both of the coordinate array
+    #: and of the data arrays. This is set automatically for the time variable.
+    var_name: str
+    #: Variable data type.
+    dtype: str
+    #: Unit annotation.
+    unit: str | None
+    #: Coordinate array.
+    coord: np.ndarray | None
+    #: Backend-specific configuration of compression codecs.
+    codecs: dict[str, Any] = field(default_factory=dict)
+    #: Flag for time variables.
+    is_time: bool = False
+
+    def __post_init__(self) -> None:
+        assert isinstance(self.partition, XarrayStoragePartition)
+        assert isinstance(self.var_name, str)
+        assert isinstance(self.dtype, str)
+        assert isinstance(self.unit, str | None)
+        assert isinstance(self.coord, np.ndarray | None)
+        assert isinstance(self.codecs, dict)
+        assert isinstance(self.is_time, bool)
+        assert bool(self.var_name) is not self.is_time
+        assert not (self.is_time and self.coord is None)
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @staticmethod
+    def var_coo_name(var_name: str, /) -> str:
+        """
+        Name of the `Xarray coordinate`_ for a simulation variable.
+        """
+        return f"{VAR_COO_PREFIX}{var_name}"
+
+    @property
+    def coo_name(self) -> str:
+        """
+        Coordinate name used by :py:meth:`.alloc_coord`, which is either a
+        :py:attr:`.XarrayStoragePartition.time_coo_name` or a
+        :py:attr:`.var_coo_name`.
+        """
+        return (self.partition.time_coo_name if self.is_time
+                else self.var_coo_name(self.var_name))
+
+    @property
+    def datavar_name(self) -> str:
+        """
+        Variable name used by :py:meth:`.alloc_var`.
+        """
+        return (self.partition.time_var_name if self.is_time
+                else self.partition.dynamic_suffix)
+
+    @property
+    def dim_names(self) -> tuple[str, ...]:
+        """
+        Dimension names used by :py:meth:`.alloc_var`, which are composed of
+        :py:attr:`.XarrayStoragePartition.time_coo_name` and
+        :py:attr:`.var_coo_name`.
+        """
+        return (self.partition.time_coo_name,) + (
+            () if self.coord is None or self.is_time
+            else (self.var_coo_name(self.var_name),))
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    def dims(self, buf_size: int, /) -> tuple[int, ...]:
+        """
+        Dimension sizes used by :py:meth:`.zeros` and :py:meth:`.encoding`,
+        which are composed of ``buf_size`` and the shape of :py:attr:`.coord`.
+        """
+        return (buf_size,) + (
+            () if self.coord is None or self.is_time
+            else (len(self.coord),))
+
+    def zeros(self, buf_size: int, /) -> np.ndarray:
+        """
+        Allocate a buffer array for storing simulation data.
+        """
+        return np.zeros(self.dims(buf_size), dtype=self.dtype)
+
+    def encoding(
+        self, writer: AsyncBufferWriter, buf_size: int, /
+    ) -> dict[str, VariableEncoding]:
+        """
+        Parameters used for writing a variable array and its coordinate array to
+        persistent storage, including chunk sizes and compression codecs.
+
+        Called by: :py:meth:`.XarrayBuffer.render`.
+
+        Calls: :py:meth:`.AsyncBufferWriter.coo_codecs` and
+        :py:meth:`.AsyncBufferWriter.var_codecs`.
+        """
+        b = writer.config["buffers_per_chunk"]
+        # coordinate encoding
+        match (self.is_time, self.coord):
+            case (False, None):
+                coo_enc = {}
+            case (False, np.ndarray() as coo):
+                coo_enc = {self.coo_name: {
+                    # use 1 storage chunk for the coordinate array
+                    "chunks": coo.shape} | writer.coo_codecs(self)}
+            case (True, np.ndarray() as coo):
+                assert coo.shape == (buf_size,)
+                coo_enc = {self.coo_name: {
+                    # use 1 storage chunk for `b` buffers of the time coordinate
+                    "chunks": (b * buf_size,)} | writer.coo_codecs(self)}
+        # variable encoding
+        var_enc = {self.datavar_name: {
+            # use 1 storage chunk for `b` buffers of simulation data
+            "chunks": self.dims(b * buf_size)} | writer.var_codecs(self)}
+        return coo_enc | var_enc
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @classmethod
+    def make_time(
+        cls, partition: XarrayStoragePartition, buf_size: int, /
+    ) -> Self:
+        """
+        Create the :py:class:`.VariableSpec` for simulation time.
+
+        Called by: :py:meth:`.alloc_time`.
+        """
+        # avoid circular import at module level
+        from ecoli.processes.metabolism import TIME_UNITS
+        assert isinstance(buf_size, int)
+        return cls(
+            partition=partition, var_name="",
+            # type and units for real-valued time stamps
+            dtype=TIME_VAR_DTYPE.str, unit=TIME_UNITS.strUnit(),
+            # integer-valued Xarray dimension coordinate
+            coord=np.arange(buf_size, dtype=TIME_COO_DTYPE),
+            is_time=True)
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @staticmethod
+    def alloc_metadata(
+        partition: XarrayStoragePartition, metadata: dict, /
+    ) -> Dataset:
+        """
+        Allocate the `Xarray attribute`_ for simulation metadata.
+
+        Called by: :py:meth:`.XarrayBuffer.alloc`.
+
+        .. _Xarray attribute: https://docs.xarray.dev/en/stable/user-guide/terminology.html#term-DataTree
+        """
+        return Dataset(attrs={partition.sim_id: metadata})
+
+    def alloc_time(self, buf_size: int, /) -> Dataset:
+        """
+        Allocate the `Xarray dimension coordinate`_ and `Xarray data variable`_
+        for simulation time. ``self`` must be produced by :py:meth:`.make_time`.
+
+        Called by: :py:meth:`.XarrayBuffer.alloc`.
+
+        Calls: :py:meth:`.alloc_coord` and :py:meth:`.alloc_var`.
+        """
+        assert self.is_time and self.coord is not None
+        assert self.coord.shape == (buf_size,)
+        return self.alloc_coord().assign(self.alloc_var(buf_size)._variables)
+
+    def alloc_coord(self) -> Dataset:
+        """
+        Allocate the `Xarray coordinate`_ and `Xarray attributes`_ for an output
+        variable, which *are not* placed under
+        :py:attr:`XarrayStoragePartition.dynamic_suffix`.
+
+        Called by: :py:meth:`.XarrayBuffer.alloc`.
+
+        .. _Xarray coordinate: https://docs.xarray.dev/en/stable/user-guide/terminology.html#term-Coordinate
+        .. _Xarray attributes: https://docs.xarray.dev/en/stable/user-guide/terminology.html#term-Dataset
+        """
+        return Dataset(
+            coords={} if self.coord is None else {self.coo_name: self.coord},
+            attrs={} if self.unit is None else {self.datavar_name: self.unit})
+
+    def alloc_var(self, buf_size: int, /) -> Dataset:
+        """
+        Allocate the `Xarray data variable`_ for an output variable, which *is*
+        placed under :py:attr:`XarrayStoragePartition.dynamic_suffix`.
+
+        Called by: :py:meth:`.XarrayBuffer.alloc`.
+        """
+        return Dataset(data_vars={
+            self.datavar_name: (self.dim_names, self.zeros(buf_size))})
diff --git a/ecoli/library/xarray_emitter/test_xarray_emitter.py b/ecoli/library/xarray_emitter/test_xarray_emitter.py
new file mode 100644
index 000000000..2ac344815
--- /dev/null
+++ b/ecoli/library/xarray_emitter/test_xarray_emitter.py
@@ -0,0 +1,300 @@
+
+"""
+Unit and integration tests for :py:mod:`.xarray_emitter` and its submodules.
+"""
+
+
+from contextlib import ContextDecorator
+from dataclasses import dataclass, field
+from pathlib import Path
+from random import randint
+from typing import Any, Self, final, cast
+
+import numpy as np
+from pytest import MonkeyPatch, mark, param, raises
+from xarray import DataArray, DataTree, open_datatree
+from zarr import Group, open_consolidated
+
+from ecoli.library.test_utils import PatchConfig, filter_warnings
+from ecoli.library.xarray_emitter.emit_path import EmitPath, EmitPathType
+from ecoli.library.xarray_emitter.storage import XarrayStoragePartition
+# from ecoli.library.xarray_emitter.emitter import XarrayEmitter
+from ecoli.library.xarray_emitter.zarr_writer import (
+    AsyncZarrBufferWriter, group_tree)
+from ecoli.library.xarray_emitter.utils import WarningFilter
+from ecoli.processes.metabolism import TIME_UNITS
+
+from runscripts.test_workflow import MockEcoliSimWorkflow
+
+
+# mypy: disable-error-code="attr-defined"
+
+
+# ==============================================================================
+# unit tests
+# ==============================================================================
+
+
+class TestEmitPath:
+
+    @classmethod
+    def test_path_type(cls):
+        assert EmitPath(()).type == EmitPathType(0)
+        assert EmitPath(("agents", "13")).type.is_agent
+        assert EmitPath(("listeners", "foo", "bar")).type.is_listener
+        assert EmitPath(("log_update", "elan_vital")).type.is_update
+        assert EmitPath(("log_update", "", "listeners")).type.is_update_listener
+        with raises(AssertionError):
+            EmitPath(("agents", "0", "listeners"))
+        with raises(AssertionError):
+            EmitPath(("agents", "log_update"))
+        with raises(AssertionError):
+            EmitPath(("log_update", "baz", "log_update"))
+
+
+# ==============================================================================
+# integration tests
+# ==============================================================================
+
+
+ecolisim_warnings = [
+    WarningFilter(
+        module="scipy.integrate._ivp.bdf",
+        category=RuntimeWarning,
+        message="invalid value encountered",
+        action="ignore"),
+]
+
+
+# ------------------------------------------------------------------------------
+
+
+@final
+@dataclass
+class XarrayEmitterConfig(PatchConfig):
+    """
+    :py:class:`.PatchConfig` for the :py:class:`.XarrayEmitter`.
+    """
+
+    store: Path
+    zarr_format: int
+    threaded: bool
+    debug: bool
+    interval: int
+
+    def __post_init__(self) -> None:
+        assert isinstance(self.store, Path)
+        assert self.store.is_absolute()
+        assert not self.store.exists()
+
+    def to_dict(self) -> dict[str, Any]:
+        return {
+            "emitter": "xarray",
+            "emitter_arg": {
+                "writer": {
+                    "store": str(self.store),
+                    "threaded": self.threaded,
+                    "backend": "zarr",
+                    "backend_config": {
+                        "format": self.zarr_format
+                    },
+                },
+                "transducer": {
+                    "predicate": [
+                        [
+                            {"subsample": {"interval": self.interval}},
+                            {"fixed": {"steps": [0]}}
+                        ]
+                    ]
+                },
+                "debug": self.debug
+            }
+        }
+
+
+# ------------------------------------------------------------------------------
+
+
+@dataclass(slots=True)
+class StoreResult(ContextDecorator):
+    """
+    Context manager for opening, using both the Xarray API and the Zarr API, an
+    output store that was produced by :py:class:`.XarrayEmitter` via the
+    :py:class:`.AsyncZarrBufferWriter`.
+    """
+
+    store: Path
+    partition: XarrayStoragePartition
+    zarr_format: int
+    zarr: Group = field(init=False)  # assigned by `__enter__`
+    xarray: DataTree = field(init=False)  # assigned by `__enter__`
+
+    def __post_init__(self) -> None:
+        assert isinstance(self.store, Path)
+        assert isinstance(self.partition, XarrayStoragePartition)
+
+    def __enter__(self) -> Self:
+        ind_store = self.store / self.partition.independent_path
+        self.zarr = open_consolidated(
+            ind_store, mode="r", zarr_format=self.zarr_format)
+        self.xarray = open_datatree(
+            ind_store, mode="r", chunks=None, engine="zarr",
+            zarr_format=self.zarr_format, consolidated=True)
+        assert ind_store == self.zarr.store.root
+        assert str(ind_store) == self.xarray.encoding["source"]
+        return self
+
+    def __exit__(self, exc_type, exc, exc_tb):
+        self.close()
+
+    def close(self) -> None:
+        self.zarr.store.close()
+        self.xarray.close()
+
+
+# ------------------------------------------------------------------------------
+
+
+class TestEcoliSim:
+
+    @classmethod
+    @filter_warnings(ecolisim_warnings)
+    @filter_warnings(AsyncZarrBufferWriter.warnings_all())
+    @mark.parametrize(
+        "num_generations, last_success, interval, zarr_format, threaded, debug",
+        [param(*args, **kwargs,
+               id="gen_{}-succ_{}-intvl_{}_zarr_{}-thrd_{}-dbg_{}".format(*args))
+         for (args, kwargs) in [
+            ((1, False, 1, 2, False, True ), {}),
+            ((2, True,  3, 2, True,  False), {}),
+            ((2, True,  2, 3, True,  True), {"marks": mark.basic_workflow}),
+            ((3, False, 1, 3, True,  False), {})
+         ]])
+    def test_workflow(
+        cls, monkeypatch: MonkeyPatch, tmp_path: Path,
+        num_generations: int, last_success: bool, interval: int,
+        zarr_format: int, threaded: bool, debug: bool
+    ):
+        # set repository paths
+        sim_data_path = Path.cwd() / "out" / "kb" / "simData.cPickle"
+        config_name = "test_xarray_emitter"
+
+        # set unique test directories
+        workdir = tmp_path
+        assert workdir.is_absolute()
+        assert workdir.exists()
+        assert not(list(workdir.iterdir()))
+        daughter_outdir = workdir / "daughter_states"
+        store = workdir / "store"
+
+        # configure simulation workflow
+        wf = MockEcoliSimWorkflow(
+            monkeypatch=monkeypatch, workdir=workdir,
+            config_name=config_name, sim_data_path=sim_data_path,
+            daughter_outdir=daughter_outdir,
+            lineage_seed=randint(0, 2**10 - 1),
+            emitter_config=XarrayEmitterConfig(
+                store, zarr_format, threaded, debug, interval))
+
+        # step through workflow
+        hline = "=" * 79
+        for g in range(1, num_generations + 1):
+            print(f"\n{hline}\nGeneration: {g}\n{hline}")
+            # execute simulation
+            success = (g < num_generations) or last_success
+            partition = cast(XarrayStoragePartition, wf.sim_gen(success))
+            # read emitted data
+            with StoreResult(store, partition, zarr_format) as result:
+                # validate emitted data
+                cls.check_tree(result)
+                cls.check_encoding(result)
+                cls.check_log(result)
+                cls.check_success(result, success)
+                cls.check_time(result, interval)
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @staticmethod
+    def check_tree(res: StoreResult) -> None:
+        """
+        Check the basic integrity of the round-tripped
+        :py:class:`xarray.DataTree`.
+        """
+        # let Zarr traverse the store
+        print()
+        print(group_tree(res.zarr))
+
+        # let Xarray traverse the store
+        print()
+        print(res.xarray)
+
+        # inspect current and previous generations
+        p: XarrayStoragePartition | None = res.partition
+        while p is not None:
+            # look for expected fields in the root node
+            assert len(res.xarray.attrs[p.sim_id])
+            assert p.time_var_name in res.xarray.attrs
+            assert p.time_coo_name in res.xarray.coords
+            assert p.time_var_name in res.xarray.data_vars
+            p = p.parent if p.generation > 1 else None
+
+    @staticmethod
+    def check_encoding(res: StoreResult) -> None:
+        pass
+
+    @staticmethod
+    def check_log(res: StoreResult) -> None:
+        """
+        Check the integrity of the write log.
+        """
+        assert {"sim_step", "sim_time"} == set(
+            res.xarray.attrs.get(res.partition.log_attr_name, {}).keys())
+
+    @staticmethod
+    def check_success(res: StoreResult, success: bool) -> None:
+        """
+        Check the validity of the success flag.
+        """
+        assert success == res.xarray.attrs.get(
+            res.partition.success_attr_name, False)
+
+    @staticmethod
+    def check_time(res: StoreResult, interval: int) -> None:
+        """
+        Check the validity of the time variable.
+        """
+        # attribute names
+        sim_id = res.partition.sim_id
+        t_coo = res.partition.time_coo_name
+        t_var = res.partition.time_var_name
+        t_log = res.partition.log_attr_name
+
+        # check time unit
+        assert res.xarray.attrs[t_var] == TIME_UNITS.strUnit()
+
+        # check time coordinate
+        t_ix = res.xarray[t_coo]
+        t_n = len(t_ix)
+        assert np.array_equal(t_ix, np.arange(t_n))
+
+        # time scale, as read from data variable
+        t = cast(DataArray, res.xarray[t_var])
+        t_01 = t[{t_coo: slice(0, 2)}].values
+        t_end = t[{t_coo: -1}].values.item()
+
+        # time scale, as deduced from metadata
+        g = res.partition.generation
+        T_0, dt, dT = map(res.xarray.attrs[sim_id].get,
+                          ["initial_global_time", "time_step", "max_duration"])
+        T_01 = np.cumsum(np.array([1, interval]) * [T_0, dt])
+        T_end = res.xarray.attrs[t_log]["sim_time"]
+        idt = interval * dt
+
+        # check time grid
+        assert T_01[0] == (g - 1) * dT
+        assert T_end == T_01[0] + (dT // idt) * idt
+        assert np.array_equal(T_01, t_01)
+        assert T_end == t_end
+        assert t.values.min() == t_01[0]
+        assert t.values.max() == t_end
+        assert np.array_equiv(np.diff(t), idt)
diff --git a/ecoli/library/xarray_emitter/transducer.py b/ecoli/library/xarray_emitter/transducer.py
new file mode 100644
index 000000000..14849ed29
--- /dev/null
+++ b/ecoli/library/xarray_emitter/transducer.py
@@ -0,0 +1,601 @@
+
+"""
+Core data structures and logic of :py:mod:`.xarray_emitter`.
+
+All other submodules of :py:mod:`.xarray_emitter` are either interfacing with
+upstream (:py:class:`~vivarium.core.engine.Engine`) or downstream
+(:py:class:`.AsyncBufferWriter`) APIs, or configuring those interfaces.
+"""
+
+
+from __future__ import annotations
+
+from dataclasses import dataclass, field
+from functools import cached_property
+from typing import Any, cast, TYPE_CHECKING
+
+import xarray
+from xarray import Dataset, DataTree
+from xarray.core.datatree import NodePath
+
+from vivarium.core.types import HierarchyPath
+from vivarium.library.topology import get_in, dict_to_paths
+
+from .emit_predicate import ConjunctiveEmitPredicate
+from .view import ForestView
+from .storage import XarrayStoragePartition, VariableSpec, VariableEncoding
+from .utils import emitter_arg_error, indent
+
+if TYPE_CHECKING:
+    from .writer import AsyncBufferWriter
+
+
+# ==============================================================================
+
+
+@dataclass
+class XarrayBuffer:
+    """
+    Memory layout for the simulation data held by :py:class:`.XarrayTransducer`.
+
+    This class contains only the logic required for marshalling simulation data
+    into an in-memory hierarchical representation that is aligned with the
+    output :ref:`storage <storage_layout>` and :ref:`variable <variable_layout>`
+    layouts.
+
+    .. note::
+      :py:class:`.XarrayBuffer` *does not* use a `chunked array library`_ for
+      its in-memory Xarray data structures, because it depends on
+      "chunk-unaware" in-place operations for optimizing sequential emission
+      performance. However, the :py:class:`.AsyncZarrBufferWriter` backend
+      *does* control the `Zarr chunks`_ used for writing to persistent storage.
+
+    .. _chunked array library: https://docs.xarray.dev/en/stable/internals/chunked-arrays.html
+    .. _Zarr chunks: https://docs.xarray.dev/en/stable/user-guide/io.html#specifying-chunks-in-a-zarr-store
+    """
+
+    #: Statically configured variable layout transformation.
+    view: ForestView
+    #: Dynamic metadata, received via :py:meth:`!Engine._emit_configuration`.
+    partition: XarrayStoragePartition = field(init=False)
+
+    #: Descriptor for the time variable.
+    time_spec: VariableSpec = field(init=False)
+    #: Descriptors for simulation variables.
+    var_specs: dict[NodePath, VariableSpec] = field(default_factory=dict)
+
+    #: Root node of the :py:class:`~xarray.DataTree` buffer, holding the `Xarray
+    #: attribute`_ for simulation metadata and the cyclic buffer for the
+    #: `Xarray dimension coordinate`_ for simulation time.
+    #:
+    #: .. _Xarray attribute: https://docs.xarray.dev/en/stable/user-guide/terminology.html#term-DataTree
+    #: .. _Xarray dimension coordinate: https://docs.xarray.dev/en/stable/user-guide/terminology.html#term-Dimension-coordinate
+    root: Dataset = field(init=False)
+    #: Child arrays of the :py:class:`~xarray.DataTree` buffer, holding the
+    #: `Xarray coordinates`_ for simulation variables.
+    #:
+    #: .. _Xarray coordinates: https://docs.xarray.dev/en/stable/user-guide/terminology.html#term-Coordinate
+    child_coords: dict[NodePath, Dataset] = field(default_factory=dict)
+    #: Child arrays of the :py:class:`~xarray.DataTree` buffer, holding the
+    #: cyclic buffers for the `Xarray data variables`_ for simulation variables.
+    #:
+    #: .. _Xarray data variables: https://docs.xarray.dev/en/stable/user-guide/terminology.html#term-Variable
+    child_vars: dict[NodePath, Dataset] = field(default_factory=dict)
+
+    def __post_init__(self) -> None:
+        assert isinstance(self.view, ForestView)
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @property
+    def time_coo(self) -> str:
+        """
+        Reference to :py:attr:`.XarrayStoragePartition.time_coo_name`.
+        """
+        return self.partition.time_coo_name
+
+    @property
+    def time_var(self) -> str:
+        """
+        Reference to :py:attr:`.XarrayStoragePartition.time_var_name`.
+        """
+        return self.partition.time_var_name
+
+    @cached_property
+    def output_paths(self) -> dict[HierarchyPath, tuple[NodePath, str]]:
+        """
+        Mapping from input (Vivarium store) to output (Xarray node/variable)
+        hierarchy locations for simulation variables, as defined by
+        :py:attr:`.view` and :py:attr:`.partition`.
+
+        Used by: :py:meth:`.write`.
+        """
+        return {path: (leaf.path, self.partition.dynamic_suffix)
+                for (path, leaf) in self.view.leaves.items()}
+
+    @cached_property
+    def modified_paths(self) -> set[NodePath]:
+        """
+        Relative paths inside the independent substore that are modified during
+        a *daughter* generation. This information may be used by
+        :py:class:`.AsyncBufferWriter` backends for maintaining metadata
+        consistency.
+        """
+        return {NodePath()}
+
+    @cached_property
+    def added_paths(self) -> set[NodePath]:
+        """
+        Relative paths inside the independent substore that are added during a
+        *daughter* generation. This information may be used by
+        :py:class:`.AsyncBufferWriter` backends for maintaining metadata
+        consistency.
+        """
+        root_paths = set(map(NodePath, self.root._variables.keys()))
+        child_var_paths = set(
+            path / cast(str, var)
+            for (path, node) in self.child_vars.items()
+            for var in node._variables.keys())
+        return child_var_paths | root_paths
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    def check_layout(self) -> None:
+        """
+        Basic consistency check, performed before each buffer-level operation.
+        """
+        assert len(self.child_coords) == len(self.child_vars)
+
+    def assemble(self, partition: XarrayStoragePartition, coords: dict) -> None:
+        """
+        Compute :py:attr:`.var_specs` by combining the static configuration
+        :py:attr:`.view` with dynamically obtained metadata.
+
+        Called by: :py:meth:`.XarrayTransducer.alloc`.
+
+        Calls: :py:meth:`.TreeView.make_coords` and :py:class:`.VariableSpec`.
+
+        Args:
+          partition: Result of :py:meth:`.XarrayEmitter.extract_partition`.
+          coords:    Result of :py:meth:`.XarrayEmitter.extract_coords`.
+        """
+        assert isinstance(partition, XarrayStoragePartition)
+        self.partition = partition
+        assert not(self.var_specs)
+        for tree in self.view.forest:
+            for (lf, coo) in zip(tree.leaves, tree.make_coords(coords)):
+                self.var_specs[lf.path] = VariableSpec(
+                    partition=partition, coord=coo,
+                    var_name=lf.var_name, dtype=lf.dtype, unit=lf.unit,
+                    codecs=lf.codecs)
+
+    def alloc(self, buf_size: int, metadata: dict) -> None:
+        """
+        Allocate the in-memory Xarray data structures defined by
+        :py:attr:`.time_spec` and :py:attr:`.var_specs`.
+
+        Called by: :py:meth:`.XarrayTransducer.alloc`.
+
+        Calls: :py:meth:`.VariableSpec.alloc_metadata`,
+        :py:meth:`.VariableSpec.alloc_time`,
+        :py:meth:`.VariableSpec.alloc_coord` and
+        :py:meth:`.VariableSpec.alloc_var`.
+
+        Args:
+          buf_size: :py:attr:`.XarrayTransducer.buf_size`.
+          metadata: Result of :py:meth:`.XarrayEmitter.extract_metadata`.
+        """
+        assert not(self.child_coords)
+        self.time_spec = VariableSpec.make_time(self.partition, buf_size)
+        self.root = self.time_spec.alloc_time(buf_size).assign_attrs(
+            VariableSpec.alloc_metadata(self.partition, metadata)._attrs)
+        for (path, var) in self.var_specs.items():
+            self.child_coords[path] = var.alloc_coord()
+            self.child_vars[path] = var.alloc_var(buf_size)
+
+    def write(
+        self, buf_tix: int, sim_tix: int, t: float, data: dict[str, Any], /
+    ) -> None:
+        """
+        Marshal the simulation data for a single emit step into the output
+        buffer.
+
+        Called by: :py:meth:`XarrayTransducer.step`.
+
+        Args:
+          buf_tix: :py:attr:`.XarrayTransducer.buf_tix`.
+          sim_tix: :py:attr:`.XarrayTransducer.sim_tix`.
+          t:       Simulation time stamp.
+          data:    Input received from :py:meth:`!Engine._emit_store_data`.
+        """
+        # index into buffer along time coordinate
+        t_ix = {self.time_coo: buf_tix}
+
+        # write time stamp to buffer
+        self.root[self.time_var][t_ix] = t
+
+        # strip agent prefix and remove schema paths with empty emit values
+        agent_path = ("agents", self.partition.agent_id)
+        emit_data = dict_to_paths((), get_in(data, agent_path))
+
+        # check for expected emit paths
+        emit_queue = set(self.view.emitted_paths)
+        for (v_path, val) in emit_data:
+            # find output schema location
+            match self.output_paths.get(v_path):
+                case None:
+                    # `v_path` is not an expected emitted path
+                    if sim_tix == 0:
+                        # executed inside `Engine.__init__()`,
+                        # and hence before `XarrayEmitter.reset_emit_flags()`
+                        continue
+                    if self.view.matches_emitted_prefix_path(v_path):
+                        # ignored member of an expected emitted store
+                        continue
+                    raise KeyError(f"Unexpected emit path: {v_path}")
+                case (x_node, x_var):
+                    # write to output schema location inside buffer
+                    self.child_vars[x_node][x_var][t_ix] = val
+                    emit_queue.discard(v_path)
+        if len(emit_queue) and sim_tix > 0:
+            raise KeyError(f"Missing emit paths: {list(emit_queue)}")
+
+    def render(
+        self, writer: AsyncBufferWriter | None, buf_size: int,
+        *, include_static: bool, copy: bool
+    ) -> tuple[xarray.DataTree, dict[str, VariableEncoding]]:
+        r"""
+        Assemble the output buffer components.
+
+        Called by: :py:meth:`.XarrayTransducer.flush`.
+
+        Calls: :py:meth:`.VariableSpec.encoding` and
+        :py:meth:`xarray.DataTree.from_dict`.
+
+        Args:
+          writer:         Used for choosing backend-specific
+                          :py:type:`.VariableEncoding`\ s.
+          buf_size:       :py:attr:`.XarrayTransducer.buf_size`.
+          include_static: Include :py:attr:`.child_coords`
+                          and all :py:type:`.VariableEncoding`\ s.
+          copy:           Return a deep copy of arrays.
+
+        .. note::
+          The deep copy performed here is a conservative choice, which allows
+          the previously allocated buffer to be immediately reused for
+          subsequent writes, without relying on private implementation details
+          about whether and when Xarray or storage backends copy data during
+          their validation, encoding and serialization phases.
+
+          Another similar option would be to force deep copying via a custom
+          ``encoder`` argument to
+          :py:func:`!xarray.backends.writers.dump_to_store`. However, this would
+          merely delay the moment at which the output buffer is handed off from
+          the main thread to the writer thread.
+
+          An alternative conservative choice would be to allocate a new buffer
+          for subsequent writes; this is the approach taken in
+          :py:meth:`.ParquetEmitter.emit`. The present choice is premised on the
+          assumption that, while allocating new arrays is faster than copying
+          arrays, it may be advantageous not to force the hardware cache and
+          main memory to adjust to a new heap representation of the output
+          variable hierarchy along the :py:meth:`.write` code path, particularly
+          when many simulations are running in parallel on the same compute
+          node.
+        """
+        # fetch root node
+        root = {NodePath(): self.root._copy(deep=True) if copy else self.root}
+
+        # fetch child nodes
+        assert set(self.child_coords) == set(self.child_vars)
+        match (include_static, copy):
+            case (False, False):
+                children = self.child_vars
+            case (False, True):
+                children = {
+                    p: n._copy(deep=True)
+                    for (p, n) in self.child_vars.items()}
+            case (True, False):
+                children = {
+                    # `self.child_vars[p]` holds only `data_vars` by construction
+                    p: c.assign(self.child_vars[p]._variables)
+                    for (p, c) in self.child_coords.items()}
+            case (True, True):
+                children = {
+                    p: c._copy(deep=True).assign({
+                        k: v._copy(deep=True)
+                        for (k, v) in self.child_vars[p]._variables.items()})
+                    for (p, c) in self.child_coords.items()}
+
+        # assemble nodes
+        buf = DataTree.from_dict(cast(dict[str, Dataset], root | children))
+
+        # check consistency between composition logic and update logic
+        assert set(str(NodePath("/") / p.parent)
+                   for p in (self.added_paths | self.modified_paths)
+                   ).issubset(buf.groups)
+
+        # fetch encodings
+        enc: dict[str, VariableEncoding] = {}
+        if include_static and writer is not None:
+            enc |= {"": self.time_spec.encoding(writer, buf_size)}
+            enc |= {str(path): var.encoding(writer, buf_size)
+                    for (path, var) in self.var_specs.items()}
+        return (buf, enc)
+
+    def get_time(self, buf_tix: int) -> float:
+        """
+        Called by: :py:meth:`.XarrayTransducer.flush`.
+
+        Args:
+          buf_tix: :py:attr:`.XarrayTransducer.buf_tix`.
+        """
+        t_ix = {self.time_coo: buf_tix}
+        return self.root[self.time_var][t_ix].values.item()
+
+    def shift(self, buf_size: int) -> None:
+        """
+        Called by: :py:meth:`.XarrayTransducer.shift`.
+
+        Args:
+          buf_size: :py:attr:`.XarrayTransducer.buf_size`.
+        """
+        self.root.coords[self.time_coo] = self.root.coords[self.time_coo] + buf_size
+
+    def truncate(self, buf_tix: int) -> None:
+        """
+        Called by: :py:meth:`.XarrayTransducer.truncate`.
+
+        Args:
+          buf_tix: :py:attr:`.XarrayTransducer.buf_tix`.
+        """
+        time_sel = {self.time_coo: slice(0, buf_tix)}
+        self.root = self.root.isel(time_sel)
+        for (path, var) in self.child_vars.items():
+            self.child_vars[path] = var.isel(time_sel)
+
+    def clear(self) -> None:
+        """
+        Called by: :py:meth:`.XarrayTransducer.clear`.
+        """
+        self.root = Dataset()
+        self.child_coords = {}
+        self.child_vars = {}
+
+
+# ==============================================================================
+
+
+class XarrayTransducer:
+    """
+    Essential logical state of :py:class:`.XarrayEmitter`, managing a cyclic
+    buffer of hierarchically organized arrays.
+
+    This class establishes the temporal coupling with
+    :py:class:`~vivarium.core.engine.Engine` and :py:class:`.AsyncBufferWriter`,
+    whereas the :py:class:`.XarrayBuffer` instance it owns is responsible for
+    transforming and holding simulation data.
+
+    Example JSON configuration::
+
+      {
+        "predicate": [...],
+        "buffer": {
+          "size": 3
+        }
+      }
+
+    Here,
+
+      - ``predicate`` defines the criterion for which *simulation steps* also
+        become *emit steps*, and is parsed by
+        :py:class:`.ConjunctiveEmitPredicate`,
+      - while ``size`` is the number of *emit steps* stored in memory by
+        :py:class:`.XarrayBuffer`.
+
+    .. note::
+      The parameter ``size`` is intended to constrain the memory cost of each
+      simulation process when many simulations are executed in parallel on a
+      node with shared memory. Within that memory budget, larger buffer sizes
+      will result in fewer calls to the transport layer.
+    """
+
+    __slots__ = (
+        "__dict__", "predicate", "buffer",
+        "buf_size", "buf_tix", "sim_tix", "debug"
+    )
+
+    def __init__(self, config: dict[str, Any], /, *, debug: bool=False) -> None:
+        self.validate_config(_config := config["transducer"])
+
+        self.predicate = ConjunctiveEmitPredicate.build(_config["predicate"])
+        """ Criterion for which *simulation steps* also become *emit steps*. """
+
+        view = ForestView.from_dict(config["view"])
+        self.buffer: XarrayBuffer = XarrayBuffer(view)
+        """ In-memory cyclic buffer for simulation data. """
+
+        self.buf_size: int = _config["buffer"]["size"]
+        """ Size of time dimension. """
+        self.buf_tix: int = 0
+        """
+        Current relative *emit step* inside the cyclic buffer; advanced at the
+        end of a :py:meth:`.step` call.
+        """
+        self.sim_tix: int = 0
+        """
+        Current absolute *simulation step*; advanced at the end of a
+        :py:meth:`.step` call.
+        """
+        self.debug: bool = debug
+        """ Flag for debug-level printing. Defaults to ``False``. """
+
+    @classmethod
+    def validate_config(cls, config: dict[str, Any], /) -> None:
+        """ Require ``predicate`` and an integer ``buffer.size`` above 2. """
+        if config.get("predicate") is None:
+            raise KeyError(emitter_arg_error(
+                cls, "Missing argument", "\"predicate\": [...]"))
+        match config.get("buffer", {}).get("size"):
+            case None:
+                raise KeyError(emitter_arg_error(
+                    cls, "Missing argument", "\"buffer\": {\"size\": ...}"))
+            case int(buf_size) if buf_size > 2:
+                pass
+            case buf_size:
+                raise TypeError(emitter_arg_error(
+                    cls, "Invalid argument",
+                    f"\"buffer\": {{\"size\": {buf_size}}}"))
+
+    def __str__(self) -> str:
+        return self.display(self.buffer.render(
+            None, self.buf_size, include_static=True, copy=False)[0])
+
+    def display(self, buf: DataTree, /) -> str:
+        return (
+            f"{self.__class__.__name__}:\n"
+            f"  buf_size: {self.buf_size}\n"
+            f"  sim_tix: {self.sim_tix}, buf_tix: {self.buf_tix}\n"
+            f"  buffer:{indent(4, buf)}")
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    def check_buffer(self) -> None:
+        """
+        Basic consistency check, performed before each buffer-level operation.
+        """
+        assert 0 <= self.buf_tix <= self.buf_size
+        self.buffer.check_layout()
+
+    def alloc(
+        self, *, partition: XarrayStoragePartition, metadata: dict, coords: dict
+    ) -> None:
+        """
+        Allocate an :py:class:`XarrayBuffer` conforming to the output schema.
+        This buffer will be populated by :py:meth:`.step` at every *emit step*,
+        and will later be sent to the transport layer via :py:meth:`.flush`.
+
+        Called by: :py:meth:`.XarrayEmitter.emit`.
+
+        Args:
+          metadata: Result of :py:meth:`.XarrayEmitter.extract_metadata`.
+          coords: Result of :py:meth:`.XarrayEmitter.extract_coords`.
+        """
+        self.check_buffer()
+        self.buffer.assemble(partition, coords)
+        self.buffer.alloc(self.buf_size, metadata)
+        self.check_buffer()
+
+    def step(self, data: dict[str, Any], /) -> bool:
+        r"""
+        Process one *simulation step*: when :py:attr:`.predicate` accepts it,
+        record the simulation data as a new *emit step* inside
+        :py:attr:`.buffer`.
+
+        Called by: :py:meth:`.XarrayEmitter.emit`.
+
+        Calls: :py:meth:`.ConjunctiveEmitPredicate.__call__` and
+        :py:meth:`.XarrayBuffer.write`.
+
+        Args:
+          data: Payload from :py:meth:`.XarrayEmitter.emit`.
+
+        Returns:
+          `False` if an emit step is due but the buffer is full, so that
+          :py:meth:`.flush`\ ing is required first; otherwise `True`.
+        """
+        t = get_in(data, ("time",))
+        if self.predicate(self.sim_tix, t, data):
+            if self.buf_tix >= self.buf_size:
+                # no free slot left: writing now would raise an `IndexError`
+                return False
+            # store the data in the current emit slot
+            self.buffer.write(self.buf_tix, self.sim_tix, t, data)
+            # advance to the next emit slot
+            self.buf_tix += 1
+        # advance the simulation step, whether or not it was emitted
+        self.sim_tix += 1
+        return True
+
+    def flush(
+        self, writer: AsyncBufferWriter, *, include_static: bool, final: bool
+    ) -> tuple[xarray.DataTree, dict[str, VariableEncoding], dict[str, Any]]:
+        r"""
+        Assemble the output buffer that will be sent to persistent storage, and
+        perform associated cache and memory management tasks.
+
+        Called by: :py:meth:`.AsyncBufferWriter.write`.
+
+        Calls: :py:meth:`.XarrayBuffer.render` and
+        :py:meth:`.AsyncBufferWriter.merge_attributes`.
+
+        Args:
+          writer:         Used for choosing backend-specific
+                          :py:type:`.VariableEncoding`\ s and for combining
+                          metadata.
+          include_static: Include :py:attr:`.XarrayBuffer.child_coords`
+                          and all :py:type:`.VariableEncoding`\ s.
+          final:          Indicate the final buffer (no copy; cleared afterwards).
+
+        Returns:
+          - The rendered in-memory buffer; a deep copy unless ``final``.
+          - Backend-specific variable encodings, only if ``include_static``.
+          - A JSON-serializable reference to the latest emitted simulation step.
+        """
+        self.check_buffer()
+        if final:
+            assert not include_static
+            if self.buf_tix < self.buf_size:
+                # at least one unfilled emit step inside allocated buffer
+                self.truncate()
+        else:
+            assert self.buf_tix == self.buf_size
+        (buf, enc) = self.buffer.render(
+            writer, self.buf_size,
+            include_static=include_static, copy=not final)
+        writer.merge_attributes(buf)
+        ref = {"sim_step": self.sim_tix,
+               "sim_time": self.buffer.get_time(self.buf_tix - 1)}
+        if final:
+            # reference to buffer components no longer needed
+            self.clear()
+        if self.debug:
+            hline = "-" * 79
+            print(hline, "\n", self.display(buf), "\n", hline)
+        return (buf, enc, ref)
+
+    def shift(self) -> None:
+        """
+        Shift the time coordinate by the buffer size, without modifying the
+        buffer content otherwise. This is used after a full buffer has been
+        flushed, and before new values are written to it.
+
+        Calls: :py:meth:`.XarrayBuffer.shift`.
+        """
+        self.check_buffer()
+        assert self.buf_tix == self.buf_size
+        self.buf_tix = 0
+        self.buffer.shift(self.buf_size)
+
+    def truncate(self) -> None:
+        """
+        Remove excess buffer space before flushing the final buffer.
+
+        Called by: :py:meth:`.flush`.
+
+        Calls: :py:meth:`.XarrayBuffer.truncate`.
+        """
+        self.buf_size = self.buf_tix
+        self.buffer.truncate(self.buf_tix)
+
+    def clear(self) -> None:
+        """
+        Empty all buffer components after flushing the final buffer.
+
+        Called by: :py:meth:`.flush`.
+
+        Calls: :py:meth:`.XarrayBuffer.clear`.
+        """
+        self.buf_tix = 0
+        self.sim_tix = 0
+        self.buffer.clear()
diff --git a/ecoli/library/xarray_emitter/utils.py b/ecoli/library/xarray_emitter/utils.py
new file mode 100644
index 000000000..197749ed7
--- /dev/null
+++ b/ecoli/library/xarray_emitter/utils.py
@@ -0,0 +1,65 @@
+
+"""
+Debugging, warnings & errors.
+"""
+
+
+from collections.abc import Iterator
+from contextlib import contextmanager
+from dataclasses import dataclass, astuple
+from itertools import starmap
+from typing import Literal
+from warnings import filterwarnings, catch_warnings
+
+
+# ==============================================================================
+
+
+def indent(s: int, obj: object) -> str:  # `repr(obj)` lines, each on a new line after `s` spaces
+    return ("\n" + " " * s).join(["", *repr(obj).split("\n")])
+
+
+# ------------------------------------------------------------------------------
+
+
+def emitter_arg_error(obj: object | type, msg: str, args: str, /) -> str:
+    owner = obj if isinstance(obj, type) else obj.__class__
+    arg_repr = f"{{\"emitter_arg\": {{{args}}}}}"
+    return f"\n  {msg} for {owner.__name__}:\n    {arg_repr}"
+
+
+# ------------------------------------------------------------------------------
+
+
+@dataclass(kw_only=True, slots=True, frozen=True)
+class WarningFilter:
+    """
+    Specification of a single warning filter. It is handed to
+    :py:func:`warnings.filterwarnings` in tuple form, and to
+    :py:func:`pytest.mark.filterwarnings` in string form.
+    """
+
+    action: Literal["ignore", "error"]
+    message: str
+    category: type[Warning]
+    module: str
+
+    def __post_init__(self) -> None:
+        assert issubclass(self.category, Warning)
+
+    def __str__(self) -> str:
+        cat = self.category
+        prefix = "" if cat.__module__ == "builtins" else f"{cat.__module__}."
+        name = f"{prefix}{cat.__name__}"
+        return f"{self.action}:{self.message}:{name}:{self.module}"
+
+
+@contextmanager
+def filter_warnings(filters: list[WarningFilter]) -> Iterator[None]:
+    """
+    Temporarily install ``filters`` via :py:func:`warnings.filterwarnings`.
+    """
+    with catch_warnings():
+        for spec in filters:
+            filterwarnings(*astuple(spec))
+        yield None
diff --git a/ecoli/library/xarray_emitter/view.py b/ecoli/library/xarray_emitter/view.py
new file mode 100644
index 000000000..e25eaff9b
--- /dev/null
+++ b/ecoli/library/xarray_emitter/view.py
@@ -0,0 +1,386 @@
+
+"""
+Specification of the schema transformation from the input hierarchy (Vivarium
+stores) to the output hierarchy (Xarray nodes/variables), which is used to
+construct the in-memory representation of :py:class:`.XarrayBuffer`.
+
+See :ref:`variable_layout` for an overview.
+"""
+
+
+from __future__ import annotations
+
+from collections.abc import Iterator
+from dataclasses import dataclass, field
+from operator import itemgetter
+from itertools import chain
+from functools import cached_property
+from typing import Any, Self
+
+import numpy as np
+from xarray.core.datatree import NodePath
+
+import unum
+import pint
+
+from vivarium.core.types import HierarchyPath
+from vivarium.library.topology import get_in, dict_to_paths
+
+from .utils import emitter_arg_error
+from .emit_path import EmitPath
+
+
+# ==============================================================================
+
+
+@dataclass(kw_only=True, slots=True)
+class LeafView:
+    """
+    Specification for how an individual Vivarium variable should be mapped onto
+    a :py:class:`~xarray.DataArray` inside an eventual
+    :py:class:`~xarray.DataTree` hierarchy.
+
+    Example JSON configuration with default codecs::
+
+      {
+        "path": "metabolism/fluxes/internal/rxn",
+        "unit": "[mmol/L.s]",
+        "dtype": "<f4"
+      }
+
+    Example JSON configuration with custom codecs for the Zarr backend::
+
+      {
+        "path": "bulk/bulk_molecule",
+        "dtype": "<i8",
+        "codecs": {
+          "filters_v2": [],
+          "filters_v3": [],
+          "compressors_v2": [{
+            "id": "lzma", "format": 3, "check": -1, "preset": null,
+            "filters": [{"id": 3, "dist": 8}, {"id": 33, "preset": 5}]
+          }],
+          "compressors_v3": [{
+            "name": "numcodecs.lzma",
+            "configuration": {
+              "format": 3,
+              "filters": [{"id": 3, "dist": 8}, {"id": 33, "preset": 5}]
+            }
+          }]
+        }
+      }
+
+    The value of ``codecs`` is interpreted by
+    :py:meth:`.AsyncBufferWriter.coo_codecs` and
+    :py:meth:`.AsyncBufferWriter.var_codecs`.
+
+    .. hint::
+      In this example, ``_v2``/``_v3`` refers to the Zarr format, which is
+      chosen by the configuration value ``emitter_arg.writer.zarr.format``. Zarr
+      codecs only need to be specified in both formats if both formats will be
+      used.
+    """
+
+    #: Target variable path inside the eventual :py:class:`~xarray.DataTree`.
+    path: NodePath
+    #: `Data type`_ for the output :py:class:`~xarray.DataArray`, provided either
+    #: as a string or as a :py:class:`numpy.dtype`.
+    #:
+    #: .. _Data type: https://numpy.org/doc/stable/reference/arrays.dtypes.html
+    dtype: str
+    #: Unit string to store as an attribute inside the node, provided either
+    #: as a string, as a :py:class:`pint.Unit`, or as a :py:class:`unum.Unum`.
+    unit: str | None = None
+    #: Backend-specific configuration of output codecs.
+    codecs: dict[str, Any] = field(default_factory=dict)
+
+    def __post_init__(self) -> None:
+        # normalize `.path` to a non-empty `NodePath`
+        match self.path:
+            case NodePath():
+                pass
+            case str():
+                self.path = NodePath(self.path)
+            case p:
+                raise TypeError(
+                    f"Expected (str|NodePath) in `.path`, but received: {p}")
+        if not self.path.parts:
+            raise ValueError(
+                f"Expected non-empty `.path`, but received: {self.path}")
+        # normalize `.dtype` to the string form of a `numpy.dtype`
+        match self.dtype:
+            case str() | np.dtype() | type():
+                self.dtype = np.dtype(self.dtype).str
+            case t:
+                raise TypeError(
+                    f"Expected (str|np.dtype) in `.dtype` for output variable "
+                    f"\"{self.path}\", but received: {t}")
+        # normalize `.unit` to `None` or a unit string
+        match self.unit:
+            case None:
+                pass
+            case "":
+                raise TypeError(
+                    f"Use `None` instead of \"\" in `.unit` for output variable "
+                    f"\"{self.path}\".")
+            case str(u):
+                if not (u.startswith("[") and u.endswith("]")):
+                    raise ValueError(
+                        f"Expected \"[...]\" in `.unit` for output variable "
+                        f"\"{self.path}\", but received: {u}")
+            case pint.Unit() as u:
+                self.unit = f"[{u}]"
+            case unum.Unum() as u:
+                if u.asNumber() != 1.0:
+                    raise ValueError(
+                        f"No numerical value expected in `.unit` for "
+                        f"output variable \"{self.path}\", but received: {u}")
+                self.unit = u.strUnit()
+            case u:
+                raise TypeError(
+                    f"Expected (None|str|pint.Unit|unum.Unum) in `.unit` for "
+                    f"output variable \"{self.path}\", but received: {u}")
+        if not isinstance(self.codecs, dict):
+            raise TypeError(
+                f"Expected (dict) in `.codecs` for output variable "
+                f"\"{self.path}\", but received: {self.codecs}")
+
+    @classmethod
+    def from_dict(cls, config: dict[str, Any], /) -> Self:
+        return cls(**config)
+
+    def to_dict(self) -> dict[str, str | None]:
+        return {"path": str(self.path), "dtype": self.dtype, "unit": self.unit}
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @property
+    def var_name(self) -> str:
+        return self.path.name
+
+
+# ==============================================================================
+
+
+@dataclass(kw_only=True)
+class TreeView:
+    """
+    A mapping from a Vivarium schema to a partial :py:class:`~xarray.DataTree`
+    specification, assuming that the input schema has a uniform metadata
+    provider --- i.e., either metadata with a common root path, or no metadata
+    at all.
+
+    Example JSON configuration::
+
+      {
+        "root": ["log_update", "ecoli-metabolism", "listeners"],
+        "variables": {
+          "fba_results": {
+            "coefficient": [{...}],
+            "reaction_fluxes": [{...}],
+            "external_exchange_fluxes": [{...}]
+          },
+          "enzyme_kinetics": {
+            "counts_to_molar": [{...}],
+            "actual_fluxes": [{...}],
+            "target_fluxes": [{...}]
+          }
+        }
+      }
+
+    Here, ``variables`` represents a Vivarium schema, and should map directly
+    onto the :py:class:`~vivarium.core.store.Store` hierarchy under ``root``.
+    Each ``[{...}]`` is parsed into a :py:class:`.LeafView`, and is enclosed by
+    a JSON array in order to distinguish it syntactically from the arbitrary
+    nesting of JSON objects.
+    """
+
+    #: Path within an agent store, which is used for extracting both
+    #: simulation data and associated metadata. Provided as a
+    #: :py:data:`~vivarium.core.types.HierarchyPath`, and parsed into an
+    #: :py:class:`.EmitPath`.
+    root: EmitPath
+    #: Flag for extracting coordinate annotations from the result of
+    #: :py:meth:`~ecoli.experiments.ecoli_master_sim.EcoliSim.output_metadata`.
+    metadata: bool = True
+    #: Schema relative to :py:attr:`.root`, holding :py:class:`.LeafView`
+    #: arguments as leaf values.
+    variables: dict[str, Any]
+
+    #: Input :py:data:`~vivarium.core.types.HierarchyPath`\ s
+    #: extracted from :py:attr:`.variables`.
+    paths: list[HierarchyPath] = field(init=False)
+    #: Output :py:class:`.LeafView`\ s parsed from :py:attr:`.variables`.
+    leaves: list[LeafView] = field(init=False)
+
+    def __post_init__(self) -> None:
+        self.root = EmitPath(self.root)  # parse the configured HierarchyPath
+        assert not self.root.type.is_agent
+        assert isinstance(self.metadata, bool)
+        assert isinstance(self.variables, dict)
+        if not self.variables:
+            raise self._arg_error("Missing arguments", "")
+        paths, leaves = map(list, zip(*dict_to_paths((), self.variables)))
+        if not all(map(len, paths)):
+            raise self._arg_error("Empty path", "...")
+        if len(frozenset(paths)) != len(paths):
+            raise self._arg_error("Duplicate paths", "...")
+        for path, leaf in zip(paths, leaves):
+            if len(leaf) != 1:  # every leaf is a one-element `[{...}]` array
+                raise self._arg_error(
+                    f"Expected single output spec for path {path}", "...")
+        self.paths = paths
+        self.leaves = list(map(LeafView.from_dict, map(itemgetter(0), leaves)))
+
+    def _arg_error(self, msg: str, variables: str) -> ValueError:
+        return ValueError(emitter_arg_error(
+            self, msg,
+            f"\"view\": ["
+            f"\n      {{\"root\": {self.root.path},"
+            f"\n        \"variables\": {{{variables}}}}}]"))
+
+    @classmethod
+    def from_dict(cls, config: dict[str, Any], /) -> Self:
+        return cls(**config)
+
+    def to_dict(self) -> dict[str, str | bool | dict[str, Any]]:
+        return {"root": self.root.path, "metadata": self.metadata,
+                "variables": self.variables}
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @cached_property
+    def emitting_paths(self) -> list[HierarchyPath]:
+        """
+        The root's emitting path alone for update roots, else extended per path.
+        """
+        if self.root.type.is_update:
+            return [self.root.emitting_path]
+        base = self.root.emitting_path
+        return [base + rel_path for rel_path in self.paths]
+
+    @cached_property
+    def emitted_paths(self) -> list[HierarchyPath]:
+        """
+        Composition of :py:attr:`.root` and :py:attr:`.paths`.
+        """
+        return [self.root.path + p for p in self.paths]
+
+    @cached_property
+    def emitted_prefix_paths(self) -> list[HierarchyPath]:
+        """
+        If a path is contained in :py:attr:`.emitted_paths` but not in
+        :py:attr:`.emitting_paths`, then it should have a prefix matching this
+        collection.
+        """
+        if self.root.type.is_update:
+            return [self.root.emitting_path]
+        else:
+            return []
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @staticmethod
+    def serialize_coord(coo: Any, /) -> np.ndarray | None:
+        """
+        Called by: :py:meth:`.make_coords`.
+        """
+        return None if coo is None else np.array(coo, copy=None)
+
+    def make_coords(
+        self, coords: dict[str, Any], /
+    ) -> Iterator[np.ndarray | None]:
+        """
+        Yield one coordinate annotation per entry of :py:attr:`.paths`, looked
+        up below the root's metadata path when :py:attr:`.metadata` is set.
+
+        Called by: :py:meth:`.XarrayBuffer.assemble`.
+
+        Calls: :py:meth:`.serialize_coord`.
+
+        Args:
+          coords: Result of :py:meth:`.XarrayEmitter.extract_coords`.
+        """
+        if not self.metadata:
+            # metadata lookup disabled: one `None` placeholder per path
+            yield from (None for _ in self.paths)
+            return
+        subtree: dict[str, Any] = get_in(coords, self.root.metadata_path)
+        for rel_path in self.paths:
+            yield self.serialize_coord(get_in(subtree, rel_path))
+
+
+# ==============================================================================
+
+
+@dataclass
+class ForestView:
+    """
+    Specification for how a collection of Vivarium schema entries and their
+    metadata should be mapped onto a complete :py:class:`~xarray.DataTree`.
+
+    Example JSON configuration::
+
+      [
+        {...},
+        {...},
+        {...}
+      ]
+
+    Here, each ``{...}`` is parsed into a :py:class:`.TreeView`.
+    """
+
+    #: Full schema with :py:class:`.LeafView` leaves.
+    forest: list[TreeView]
+
+    def __post_init__(self) -> None:
+        assert isinstance(self.forest, list)
+        assert all(isinstance(t, TreeView) for t in self.forest)
+        if not len(self.forest):
+            raise ValueError(emitter_arg_error(
+                self, "Missing arguments", "\"view\": [...]"))
+        paths = list(chain.from_iterable(t.paths for t in self.forest))
+        if len(frozenset(paths)) != len(paths):
+            raise ValueError(emitter_arg_error(
+                self, "Duplicate paths", "\"view\": [...]"))
+
+    @classmethod
+    def from_dict(cls, config: list[dict[str, Any]], /) -> Self:
+        return cls(list(map(TreeView.from_dict, config)))
+
+    def to_dict(self) -> list[dict[str, str | bool | dict]]:
+        return [t.to_dict() for t in self.forest]
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @cached_property
+    def emitting_paths(self) -> list[HierarchyPath]:
+        """
+        Concatenation of every tree's :py:attr:`.TreeView.emitting_paths`.
+        """
+        return list(chain.from_iterable(t.emitting_paths for t in self.forest))
+
+    @cached_property
+    def emitted_paths(self) -> list[HierarchyPath]:
+        """
+        Concatenation of every tree's :py:attr:`.TreeView.emitted_paths`.
+        """
+        return list(chain.from_iterable(t.emitted_paths for t in self.forest))
+
+    def matches_emitted_prefix_path(self, path: HierarchyPath, /) -> bool:
+        """
+        Report whether ``path`` starts with any entry of some tree's
+        :py:attr:`.TreeView.emitted_prefix_paths`.
+        """
+        roots = chain.from_iterable(t.emitted_prefix_paths for t in self.forest)
+        return any(path[:len(root)] == root for root in roots)
+
+    @cached_property
+    def leaves(self) -> dict[HierarchyPath, LeafView]:
+        r"""
+        Index of :py:class:`.LeafView`\ s by their emitted Vivarium path.
+
+        Called by: :py:meth:`.XarrayBuffer.assemble`.
+        """
+        return {path: leaf for t in self.forest
+                for path, leaf in zip(t.emitted_paths, t.leaves)}
diff --git a/ecoli/library/xarray_emitter/writer.py b/ecoli/library/xarray_emitter/writer.py
new file mode 100644
index 000000000..935ed5195
--- /dev/null
+++ b/ecoli/library/xarray_emitter/writer.py
@@ -0,0 +1,523 @@
+
+"""
+Abstract base classes that determine the transport and session layers of
+:py:mod:`.xarray_emitter`.
+
+Backend-specific code should be placed into subclasses in a separate module.
+"""
+
+
+from __future__ import annotations
+
+from abc import ABC, abstractmethod
+from collections.abc import Callable, Coroutine
+from concurrent.futures import Future, Executor, ThreadPoolExecutor
+from functools import cached_property
+from inspect import ismethod
+from pathlib import Path
+from typing import Any
+from weakref import finalize
+
+import numpy as np
+from xarray import DataTree
+from xarray.core.datatree import NodePath
+from xarray.backends.common import ArrayWriter
+
+from ..parquet_emitter import BlockingExecutor
+from .utils import WarningFilter, filter_warnings, emitter_arg_error
+from .storage import XarrayStoragePartition, VariableSpec, VariableEncoding
+from .transducer import XarrayBuffer, XarrayTransducer
+
+
+# ==============================================================================
+
+
+class AsyncArrayWriter[ArrT](ArrayWriter, ABC):
+    """
+    Low-level control over the write operations generated by an
+    :py:class:`!xarray.backends.common.AbstractWritableDataStore` is implemented
+    by monkey-patching the Xarray stack layer that plays the role of an
+    `algebraic effect system`_ for storage updates, namely:
+
+      - by subclassing the effect type
+        :py:class:`!xarray.backends.common.ArrayWriter`,
+      - by intercepting the write operations passed to :py:meth:`.add`,
+      - and by controlling their execution in :py:meth:`.sync`.
+
+    .. _algebraic effect system: https://en.wikipedia.org/wiki/Effect_system
+    """
+
+    def add(self, source, target, region=None) -> None:
+        """
+        Enqueue a write operation for the transport layer, after all encodings
+        and checks at the presentation and session layers have succeeded.
+
+        Called by:
+        :py:meth:`!xarray.backends.common.AbstractWritableDataStore.set_variables`.
+        """
+        # expect materialised slices along time dimension
+        assert isinstance(source, np.ndarray)
+        assert isinstance(target, self.target_type)
+        assert all(isinstance(d, slice) for d in region)  # `None` is unsupported
+        self.sources.append(source)
+        self.targets.append(target)
+        self.regions.append(region)
+
+    def sync(self, compute=True, chunkmanager_store_kwargs=None) -> None:
+        """
+        Send the enqueued write operations asynchronously over the transport
+        layer, and wait until all operations have completed.
+
+        Calls: :py:meth:`._sync`.
+        """
+        # the write queue should not be empty
+        assert self.sources
+        # no external synchronisation mechanism should be active
+        assert self.lock is None
+        # no external chunk manager should be active
+        assert chunkmanager_store_kwargs is None
+        self._sync(self._async())
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @property
+    @abstractmethod
+    def target_type(self) -> type[ArrT]:
+        """
+        Expected type of backend-specific target object for write operations.
+        """
+        ...
+
+    @abstractmethod
+    def _sync(self, coro: Coroutine[None, None, None], /) -> None:
+        """
+        Synchronization barrier for :py:meth:`._async`.
+        """
+        ...
+
+    @abstractmethod
+    async def _async(self) -> None:
+        """
+        Coroutine executing the enqueued write operations asynchronously.
+        """
+        ...
+
+
+# ==============================================================================
+
+
+class AsyncBufferWriter[StoreT](ABC):
+    """
+    Backend-agnostic session layer for emitting :py:class:`.XarrayBuffer`
+    contents to some persistent storage, and for doing so sequentially (i.e.,
+    reusing file handles, metadata and caches) and concurrently (i.e., hiding
+    transport latency and pooling channel bandwidths). See :ref:`concurrency`
+    for the design rationale.
+
+    This abstract class is responsible for managing the session state on the
+    side of the :py:class:`.XarrayEmitter`, and for coordinating the main and
+    writer threads, at the time scale at which a buffer is filled with
+    simulation data. Within this time scale, backend-specific subclasses are
+    responsible for managing the session state on the side of the transport
+    layer, and for controlling its concurrency.
+
+    Example JSON configuration::
+
+      {
+        "store": "out/store",
+        "threaded": true,
+        "buffers_per_chunk": 10,
+        "backend": "zarr",
+        "backend_config": {...}
+      }
+
+    Here,
+
+      - ``store`` is a URI interpreted by the backend,
+      - ``threaded`` toggles the use of a separate writer thread,
+      - ``buffers_per_chunk`` is the integer-valued size ratio, in terms of
+        *emit step* counts, between one chunk of backend storage and one
+        in-memory buffer,
+      - ``backend`` determines the transport layer subclass instantiated by
+        :py:meth:`.dispatch`, e.g., :py:class:`.AsyncZarrBufferWriter`,
+      - and ``backend_config`` is interpreted by the backend subclass.
+
+    .. note::
+      The parameter ``buffers_per_chunk`` is intended to decouple the number of
+      output files from the choice of ``transducer.buffer.size`` in
+      :py:class:`.XarrayTransducer`. As a rule of thumb, 1 chunk file per
+      variable per generation is desirable in order to minimize the file system
+      pressure, unless a downstream application can benefit from smaller file
+      sizes.
+
+      The latter situation appears to be unlikely under current simulation use
+      cases. However, it may be supported in the future by extending the writer
+      configuration to further distinguish between *chunks* and *shards*, which
+      is `supported`_ by backends like Zarr.
+
+    .. _supported: https://zarr.readthedocs.io/en/latest/user-guide/performance/#sharding
+    """
+
+    @classmethod
+    def dispatch(cls, config: dict[str, Any], /) -> AsyncBufferWriter:
+        """
+        Instantiate the subclass matching ``config.emitter_arg.writer.backend``.
+        """
+        match config.get("backend"):
+            case None:
+                raise KeyError(emitter_arg_error(
+                    cls, "Missing argument", "\"writer\": {\"backend\": ...}"))
+            case "zarr":
+                # avoid circular import at module level
+                from .zarr_writer import AsyncZarrBufferWriter
+                return AsyncZarrBufferWriter(config)
+            case backend:
+                raise TypeError(emitter_arg_error(
+                    cls, "Unsupported backend",
+                    f"\"writer\": {{\"backend\": \"{backend}\"}}"))
+
+    def __init__(self, config: dict[str, Any], /) -> None:
+        self.validate_config(config)
+        self.config: dict[str, Any] = config
+        """ Static configuration, received via :py:meth:`!Emitter.__init__`. """
+
+        self._buffer: XarrayBuffer | None = None
+        self._store: StoreT | None = None
+        self._store_finalizer: Callable[[], None] | None = None
+        """ Finalizer for :py:attr:`.store`. """
+        self.executor: Executor = (ThreadPoolExecutor(max_workers=1)
+                                   if config.get("threaded", True)
+                                   else BlockingExecutor())
+        """ Thread executing :py:meth:`._write`. """
+        self.future: Future = Future()
+        """ Synchronisation primitive for :py:attr:`.executor`. """
+        self.future.set_result(None)
+        self.num_writes: int = 0
+        """ Count of submitted buffer writes. """
+
+    @classmethod
+    def validate_config(cls, config: dict[str, Any], /) -> None:
+        """
+        Check assumptions about static writer configuration.
+        """
+        match config["store"]:  # a missing key raises a bare KeyError
+            case (str() | Path()) as store if not str(store).endswith("/"):
+                pass
+            case store:
+                raise TypeError(emitter_arg_error(
+                    cls, "Invalid store path",
+                    f"\"writer\": {{\"store\": \"{store}\"}}"))
+        match config.get("buffers_per_chunk"):
+            case None:
+                raise KeyError(emitter_arg_error(
+                    cls, "Missing argument",
+                    "\"writer\": {\"buffers_per_chunk\": ...}"))
+            case int(b) if b >= 1:  # NB: `bool` is an `int`, so `True` passes
+                pass
+            case b:
+                raise ValueError(emitter_arg_error(
+                    cls, "Invalid argument",
+                    f"\"writer\": {{\"buffers_per_chunk\": {b}}}"))
+        match config.get("backend_config"):
+            case None:
+                raise KeyError(emitter_arg_error(
+                    cls, "Missing argument",
+                    "\"writer\": {\"backend_config\": {...}}"))
+            case dict():
+                pass
+            case c:
+                raise ValueError(emitter_arg_error(
+                    cls, "Invalid argument",
+                    f"\"writer\": {{\"backend_config\": {c}}}"))
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @property
+    def buffer(self) -> XarrayBuffer:
+        """
+        Dynamic configuration, received via :py:meth:`!Engine._emit_configuration`.
+        """
+        assert self._buffer is not None
+        return self._buffer
+
+    @buffer.setter
+    def buffer(self, buffer: XarrayBuffer) -> None:
+        assert self._buffer is None
+        assert isinstance(buffer, XarrayBuffer)
+        self._buffer = buffer
+
+    @property
+    def partition(self) -> XarrayStoragePartition:
+        """
+        Reference to :py:attr:`.XarrayBuffer.partition`.
+        """
+        return self.buffer.partition
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @property
+    @abstractmethod
+    def store_type(self) -> type[StoreT]:
+        """
+        Expected type of backend-specific transport layer.
+        """
+        ...
+
+    def open_store(self, buffer: XarrayBuffer, /) -> None:
+        """
+        Initialise the transport layer.
+
+        Calls: :py:meth:`._open_store`.
+
+        Args:
+          buffer: Used for obtaining dynamic metadata that is received through
+                  :py:meth:`!Engine._emit_configuration`.
+        """
+        self.buffer = buffer
+        self.store = self._open_store()
+
+    @abstractmethod
+    def _open_store(self) -> StoreT:
+        """
+        Initialise the backend-specific transport layer.
+
+        Called by: :py:meth:`.open_store`.
+        """
+        ...
+
+    @property
+    def store(self) -> StoreT:
+        """
+        Transport layer.
+        """
+        assert self._store is not None
+        assert self._store_finalizer is not None
+        return self._store
+
+    @store.setter
+    def store(self, store: StoreT) -> None:
+        assert self._store is None
+        assert self._store_finalizer is None
+        assert isinstance(store, self.store_type)
+        assert ismethod(getattr(store, "close", None))
+        self._store = store
+        self._store_finalizer = finalize(self, store.close)  # type: ignore[attr-defined]
+
+    def close(self) -> None:
+        """
+        Terminate the :py:attr:`.executor` thread, call :py:meth:`.consolidate`,
+        and close the :py:attr:`.store`.
+        """
+        if self.num_writes > 0:  # 0: nothing written; -1: `mark_success` synced
+            self.sync(shutdown=True)
+        self.executor.shutdown(wait=True)
+        self.consolidate()
+        assert self._store_finalizer is not None
+        self._store_finalizer()  # runs the `store.close` registered by the setter
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @abstractmethod
+    def coo_codecs(self, var: VariableSpec, /) -> VariableEncoding:
+        """
+        Interpret the JSON config for the backend-specific codecs of a
+        simulation coordinate.
+
+        Called by: :py:meth:`.VariableSpec.encoding`.
+        """
+        ...
+
+    @abstractmethod
+    def var_codecs(self, var: VariableSpec, /) -> VariableEncoding:
+        """
+        Interpret the JSON config for the backend-specific codecs of a
+        simulation variable.
+
+        Called by: :py:meth:`.VariableSpec.encoding`.
+        """
+        ...
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @classmethod
+    @abstractmethod
+    def warnings_make_effect(cls) -> list[WarningFilter]:
+        """
+        Filters for warnings expected in the transport layer.
+        """
+        ...
+
+    @cached_property
+    def _warnings_make_effect(self) -> list[WarningFilter]:
+        return self.warnings_make_effect()
+
+    @classmethod
+    @abstractmethod
+    def warnings_eval_effect(cls) -> list[WarningFilter]:
+        """
+        Filters for warnings expected in the transport layer.
+        """
+        ...
+
+    @cached_property
+    def _warnings_eval_effect(self) -> list[WarningFilter]:
+        return self.warnings_eval_effect()  # cached per instance for `_write`
+
+    @classmethod
+    def warnings_all(cls) -> list[WarningFilter]:
+        """
+        Combine :py:meth:`.warnings_make_effect` and
+        :py:meth:`.warnings_eval_effect`.
+        """
+        return cls.warnings_make_effect() + cls.warnings_eval_effect()
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @abstractmethod
+    def merge_attributes(self, payload: DataTree) -> None:
+        """
+        :py:meth:`.XarrayBuffer.render` is designed to only output chunk-level
+        changes to Xarray variables and attributes. While variables are always
+        either introduced or appended, some transport layer backends may
+        *overwrite* attribute containers instead of *updating* them, which would
+        invalidate attributes at :py:attr:`.XarrayBuffer.modified_paths`. This
+        method allows such conflicts to be resolved in-place, before the payload
+        is passed to :py:meth:`.make_effect`.
+
+        Called by: :py:meth:`.XarrayTransducer.flush`.
+        """
+        ...
+
+    @abstractmethod
+    def make_effect(
+        self,
+        payload: DataTree,
+        encoding: dict[str, dict[str, VariableEncoding]], /
+    ) -> AsyncArrayWriter:
+        """
+        Enqueue write operations for the transport layer.
+
+        Called by: :py:meth:`._write`.
+        """
+        ...
+
+    @staticmethod
+    def eval_effect(eff: AsyncArrayWriter, /) -> None:
+        """
+        Execute write operations in the transport layer.
+
+        Called by: :py:meth:`._write`.
+
+        Calls: :py:meth:`.AsyncArrayWriter.sync`.
+        """
+        eff.sync()
+
+    def log_effect(self, ref: dict[str, Any]) -> None:
+        """
+        After executing :py:meth:`.eval_effect`, update the persistent storage
+        with a reference to the latest exported simulation step, as returned by
+        :py:meth:`.XarrayTransducer.flush`.
+
+        Called by: :py:meth:`._write`.
+
+        Calls: :py:meth:`.update_attributes`.
+        """
+        self.update_attributes(NodePath(), {self.partition.log_attr_name: ref})
+
+    @abstractmethod
+    def update_attributes(self, path: NodePath, attrs: dict[str, Any], /) -> None:
+        """
+        Called by: :py:meth:`.log_effect` and :py:meth:`.mark_success`.
+        """
+        ...
+
+    def sync(self, *, shutdown: bool = False) -> None:
+        """
+        Block on the pending :py:attr:`.future`, then refresh the transport
+        layer state unless ``shutdown`` is set.
+
+        Calls: :py:meth:`.update_transport`.
+        """
+        self.future.result()  # re-raises any exception from the last `_write`
+        if not shutdown:
+            self.update_transport()
+
+    @abstractmethod
+    def update_transport(self) -> None:
+        """
+        Update the backend-specific transport layer state, after
+        :py:meth:`._open_store` and after each :py:meth:`._write`.
+
+        Called by: :py:meth:`.sync`.
+        """
+        ...
+
+    @abstractmethod
+    def consolidate(self) -> None:
+        """
+        For performance reasons, the metadata of a storage backend may be in an
+        inconsistent state while a generation is being simulated, when no
+        external readers are expected. This method is responsible for restoring
+        metadata consistency at the end of each generation.
+        """
+        ...
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    def write(self, transducer: XarrayTransducer, *, final: bool) -> None:
+        """
+        Concurrently write a buffer to the open store, synchronising only at the
+        subsequent call.
+
+        Calls: :py:meth:`.XarrayTransducer.flush`, :py:meth:`.sync` and
+        :py:meth:`._write`.
+
+        Args:
+          final: Indicates the final buffer, which does not require copying.
+        """
+        assert self.num_writes >= 0  # -1 once `mark_success` has run
+        msg = transducer.flush(
+            # choose backend-specific encodings
+            self,
+            # emit coordinate data and encodings only with first trajectory buffer
+            include_static=(
+                self.partition.generation == 1 and self.num_writes == 0),
+            # final trajectory buffer does not require copying
+            final=final)
+        if self.num_writes > 0:
+            # finish writing previous buffer and update transport cache
+            self.sync()
+        self.future = self.executor.submit(self._write, *msg)
+        self.num_writes += 1
+
+    def _write(
+        self,
+        payload: DataTree,
+        encoding: dict[str, dict[str, VariableEncoding]],
+        ref: dict[str, Any], /
+    ) -> None:
+        """
+        This callable is scheduled on the :py:attr:`.executor` thread using
+        :py:meth:`~concurrent.futures.Executor.submit`. It expects as inputs the
+        outputs from :py:meth:`.XarrayTransducer.flush`.
+
+        Called by: :py:meth:`.write`.
+
+        Calls: :py:meth:`.make_effect`, :py:meth:`.eval_effect` and
+        :py:meth:`.log_effect`.
+        """
+        with filter_warnings(self._warnings_make_effect):
+            eff = self.make_effect(payload, encoding)
+        with filter_warnings(self._warnings_eval_effect):
+            self.eval_effect(eff)
+            self.log_effect(ref)
+
+    def mark_success(self) -> None:
+        """
+        Mark a cell division event in the store, as indicated by the caller of
+        :py:meth:`.BufferedEmitter.finalize`.
+        """
+        self.sync()  # wait for the in-flight buffer write first
+        msg = {self.partition.success_attr_name: True}
+        self.update_attributes(NodePath(), msg)
+        self.num_writes = -1  # sentinel: `write` asserts, `close` skips `sync`
diff --git a/ecoli/library/xarray_emitter/zarr_writer.py b/ecoli/library/xarray_emitter/zarr_writer.py
new file mode 100644
index 000000000..e5c9b0c54
--- /dev/null
+++ b/ecoli/library/xarray_emitter/zarr_writer.py
@@ -0,0 +1,801 @@
+
+"""
+Transport and session layers for the Zarr storage backend.
+
+This module defines subclasses that inherit from :py:mod:`.writer`, and modifies
+the internal state in Xarray and Zarr where necessary.
+"""
+
+
+from __future__ import annotations
+
+from asyncio import Semaphore, create_task, as_completed, gather
+from collections.abc import AsyncGenerator, Coroutine
+from collections import deque
+from dataclasses import replace
+from html import escape as html_escape
+from typing import Any, Mapping, final, cast
+import sys
+import warnings
+
+from xarray import DataTree
+from xarray.core.datatree import NodePath
+from xarray.backends import ZarrStore
+from xarray.backends.writers import dump_to_store
+
+import zarr
+from zarr.abc.codec import Codec
+from zarr.abc.numcodec import Numcodec
+from zarr.core.metadata import v2, v3
+from zarr.core._tree import TreeRepr
+from zarr.types import AnyAsyncArray
+from zarr.core.array import Array, AsyncArray
+from zarr.core.sync import sync
+from zarr.core.group import (
+    Group, AsyncGroup, GroupMetadata, ConsolidatedMetadata, _getitem_semaphore)
+from zarr.errors import ZarrUserWarning, UnstableSpecificationWarning
+
+from .utils import  WarningFilter, filter_warnings, emitter_arg_error
+from .writer import AsyncArrayWriter, AsyncBufferWriter
+from .storage import VariableSpec, VariableEncoding
+
+
+# ==============================================================================
+# constants
+# ==============================================================================
+
+
+ZARR_ASYNC_CONCURRENCY: int = 4
+""" Default bound on the number of Zarr's concurrent operations. """
+ZARR_MAX_WORKERS: int = 4
+""" Default bound on the size of Zarr's internal thread pool. """
+
+ZARR_FILTERS: dict[int, list[dict[str, Any]]] = {
+    2: [{"id": "delta", "dtype": None}],
+    3: [{"name": "numcodecs.delta", "configuration": {"dtype": None}}]
+}
+""" Default filter codecs, as a function of the Zarr format. """
+ZARR_COMPRESSORS: dict[int, list[dict[str, Any]]] = {
+    2: [{"id": "blosc", "cname": "zstd", "clevel": 6,
+         "shuffle": -1, "blocksize": 0}],
+    3: [{"name": "blosc", "configuration": {
+        "cname": "zstd", "clevel": 6,
+        "typesize": None, "shuffle": None, "blocksize": 0}}]
+}
+""" Default compression codecs, as a function of the Zarr format. """
+
+
+# ==============================================================================
+# Xarray internals
+# ==============================================================================
+
+
+def _datatree_to_zarr(
+    dt: DataTree, store: ZarrStore, encoding: Mapping[str, Any] | None = None, /
+) -> AsyncZarrArrayWriter:
+    """
+    Construct the :py:class:`.AsyncZarrArrayWriter` effect from a
+    :py:class:`~xarray.DataTree` to an already open
+    :py:class:`xarray.backends.ZarrStore`, possibly along some
+    :py:attr:`!xarray.backends.ZarrStore._append_dim`.
+
+    This function checks the following assumptions:
+
+    - No `Dask chunks`_ are used within ``dt``.
+    - In the first buffer, Zarr chunks are specified for all variables via
+      ``encoding``.
+    - In subsequent buffers, ``encoding`` is left empty.
+
+    Adapted from: :py:meth:`!xarray.backends.writers._datatree_to_zarr`.
+
+    .. _Dask chunks: https://docs.xarray.dev/en/stable/user-guide/dask.html
+    """
+    if encoding is None:
+        encoding = {}
+    if absolute := [p for p in encoding.keys() if p.startswith("/")]:
+        raise ValueError(f"unexpected absolute paths in `encoding`: {absolute}")
+    # TODO: fix in `_datatree_to_zarr()` (xarray==2026.04)
+    encoding = {f"/{p}": e for (p, e) in encoding.items()}
+    if unexpected := set(encoding.keys()) - set(dt.groups):
+        raise ValueError(
+            f"unexpected encoding group name(s) provided: {unexpected}")
+    if any(dt.chunksizes.values()):
+        raise ValueError("unexpected Dask chunks before Zarr export")
+
+    writer = AsyncZarrArrayWriter()
+    for (rel_path, node) in dt.subtree_with_keys:
+        # materialise a node
+        if not (len(node.dataset) or len(node.dataset.attrs)):
+            # skip nodes without any data or metadata, in order to avoid
+            # a failing check against `store._append_dim`
+            continue
+        elif node is dt:
+            # root node
+            ds = node.to_dataset(inherit=True)
+            node_store = store
+        else:
+            # descendant node: do not duplicate stored coordinates
+            ds = node.to_dataset(inherit=False)
+            node_store = store.get_child_store(rel_path)
+        # generate write operations for a node
+        ds = node_store._validate_and_autodetect_region(ds)
+        node_enc = encoding.get(node.path)
+        if node_enc is None and encoding:
+            raise KeyError(f"missing encoding for \"{node.path}\"")
+        # TODO: fix in `_datatree_to_zarr()` (xarray==2026.04)
+        node_store._validate_encoding(node_enc)
+        dump_to_store(ds, node_store, writer, encoding=node_enc)
+    return writer
+
+
+# ==============================================================================
+# Zarr internals
+# ==============================================================================
+
+
+async def consolidate_metadata(
+    group: AsyncGroup,
+) -> AsyncGroup:
+    """
+    Consolidate the metadata of all nodes in a hierarchy, including the root
+    node.
+
+    Adapted from: :py:func:`zarr.api.asynchronous.consolidate_metadata`.
+    """
+    # check store properties
+    assert isinstance(group, AsyncGroup)
+    assert group.store.supports_listing
+    assert group.store.supports_consolidated_metadata
+    group.store._check_writable()
+    assert group.metadata.consolidated_metadata is None
+
+    # traverse store and read all metadata
+    members_metadata = {
+        k: v.metadata
+        async for (k, v) in
+        group.members(max_depth=None, use_consolidated_for_children=False)}
+    # TODO: fix in `consolidate_metadata()` (zarr==3.1.6)
+    members_metadata |= {"": group.metadata}
+
+    # combine and write consolidated metadata
+    for k, v in members_metadata.items():
+        if isinstance(v, GroupMetadata) and v.consolidated_metadata is None:
+            members_metadata[k] = _replace_consolidated_metadata(
+                v, ConsolidatedMetadata(metadata={}))
+    ConsolidatedMetadata._flat_to_nested(members_metadata)
+    group = _replace_consolidated_metadata(
+        group, ConsolidatedMetadata(metadata=members_metadata))
+    await group._save_metadata()
+    return group
+
+
+async def reconsolidate_metadata(
+    group: AsyncGroup, modified_keys: set[str], added_keys: set[str], /
+) -> AsyncGroup:
+    """
+    Incrementally update consolidated metadata. Rather than recursing through
+    the entire store tree and recomputing the consolidated metadata afresh, load
+    the existing consolidated metadata, and update it with the current metadata
+    from a known list of modified and added paths.
+
+    Adapted from: :py:func:`zarr.api.asynchronous.consolidate_metadata`.
+    """
+    # check paths
+    assert isinstance(modified_keys, set)
+    assert isinstance(added_keys, set)
+    assert all(isinstance(k, str) for k in modified_keys)
+    assert all(isinstance(k, str) for k in added_keys)
+    assert modified_keys.isdisjoint(added_keys)
+
+    # check store properties
+    assert isinstance(group, AsyncGroup)
+    assert group.store.supports_listing
+    assert group.store.supports_consolidated_metadata
+    group.store._check_writable()
+    assert group.metadata.consolidated_metadata is not None
+
+    # read existing consolidated metadata
+    members_metadata = {
+        k: n.metadata
+        async for (k, n) in
+        group.members(max_depth=None, use_consolidated_for_children=True)}
+    for (_, v) in members_metadata.items():
+        if isinstance(v, GroupMetadata):
+            assert v.consolidated_metadata is not None
+
+    # read metadata at updated paths
+    group = _replace_consolidated_metadata(group, None)
+    mod_members_metadata, add_members_metadata = [
+        {k: n.metadata async for (k, n) in _iter_from_keys(group, keys)}
+        for keys in [modified_keys, added_keys]]
+
+    # check assumptions about metadata updates
+    old_keys = set(members_metadata.keys()) | {""}
+    assert set(mod_members_metadata.keys()).issubset(old_keys)
+    assert set(add_members_metadata.keys()).isdisjoint(old_keys)
+
+    # combine and write consolidated metadata
+    for metadata in [mod_members_metadata, add_members_metadata]:
+        for (k, v) in metadata.items():
+            if isinstance(v, GroupMetadata):
+                assert v.consolidated_metadata is None
+                metadata[k] = _replace_consolidated_metadata(
+                    v, ConsolidatedMetadata(metadata={}))
+    members_metadata |= mod_members_metadata | add_members_metadata
+    del old_keys, mod_members_metadata, add_members_metadata
+    # TODO: fix in `ConsolidatedMetadata._flat_to_nested()` (zarr==3.1.6)
+    members_metadata = dict(sorted(members_metadata.items(),
+                                   key=lambda kv: bfs_key(kv[0])))
+    ConsolidatedMetadata._flat_to_nested(members_metadata)
+    group = _replace_consolidated_metadata(
+        group, ConsolidatedMetadata(metadata=members_metadata))
+    await group._save_metadata()
+    return group
+
+
+def _replace_consolidated_metadata[NodeT: (AsyncGroup, GroupMetadata)](
+    node: NodeT, consolidated: ConsolidatedMetadata | None
+) -> NodeT:
+    match node:
+        case AsyncGroup():
+            _metadata = _replace_consolidated_metadata(node.metadata, consolidated)
+            return replace(node, metadata=_metadata)
+        case GroupMetadata():
+            assert isinstance(consolidated, ConsolidatedMetadata | None)
+            return replace(node, consolidated_metadata=consolidated)
+        case _:
+            raise ValueError(node)
+
+
+# ------------------------------------------------------------------------------
+
+
+async def _iter_from_keys(
+    node: AsyncGroup, keys: set[str], /
+) -> AsyncGenerator[tuple[str, AnyAsyncArray | AsyncGroup], None]:
+    """
+    Iterate over a known list of arrays and groups contained within a group,
+    returning relative paths and node objects.
+
+    Called by: :py:func:`.reconsolidate_metadata`.
+
+    Adapted from: :py:func:`!zarr.core.group._iter_members`.
+    """
+    semaphore = Semaphore(zarr.config.get("async.concurrency"))
+    node_tasks = tuple(
+        create_task(_getitem_semaphore(node, key, semaphore), name=key)
+        for key in keys)
+    for fetched_node_coro in as_completed(node_tasks):
+        try:
+            fetched_node = await fetched_node_coro
+        except KeyError as e:
+            warnings.warn(
+                f"Object at {e.args[0]} is not recognized as a component of a Zarr hierarchy.",
+                ZarrUserWarning, stacklevel=1)
+            continue
+        match fetched_node:
+            case AsyncArray() | AsyncGroup():
+                # remove prefix path, accommodating normalised root path
+                rel_path = fetched_node.name.removeprefix(node.name).removeprefix("/")
+                yield (rel_path, fetched_node)
+            case _:
+                raise ValueError(f"Unexpected type: {type(fetched_node)}")
+
+
+def bfs_key(path: str) -> tuple:
+    """
+    Corrected sorting key for the pre-processing step in
+    :py:meth:`!zarr.core.group.ConsolidatedMetadata._flat_to_nested`.
+
+    Called by: :py:func:`.reconsolidate_metadata`.
+    """
+    segments = path.split("/")
+    return (len(segments), *segments)
+
+
+# ------------------------------------------------------------------------------
+
+
+def group_tree(
+    group: Group,
+    level: int | None = None,
+    *,
+    max_nodes: int = 500,
+    plain: bool = False,
+) -> TreeRepr:
+    """
+    Adapted from: :py:meth:`!zarr.Group.tree`.
+
+    Calls: :py:func:`.group_tree_async`.
+    """
+    return sync(group_tree_async(
+        group._async_group,
+        max_depth=level, max_nodes=max_nodes, plain=plain))
+
+
+async def group_tree_async(
+    group: AsyncGroup,
+    max_depth: int | None = None,
+    *,
+    max_nodes: int = 500,
+    plain: bool = False,
+) -> TreeRepr:
+    """
+    Fix edge case with infinite recursion in
+    :py:func:`!zarr.core._tree.group_tree_async`.
+
+    Called by: :py:func:`.group_tree`.
+    """
+    members: list[tuple[str, Any]] = []
+    truncated = False
+    async for item in group.members(max_depth=max_depth):
+        if len(members) == max_nodes:
+            truncated = True
+            break
+        members.append(item)
+    members.sort(key=lambda key_node: key_node[0])
+
+    # Set up styling tokens: ANSI bold for terminals, HTML <b> for Jupyter,
+    # or empty strings when plain=True (useful for LLMs, logging, files).
+    if plain:
+        ansi_open = ansi_close = html_open = html_close = ""
+    else:
+        # Avoid emitting ANSI escape codes when output is piped or in CI.
+        use_ansi = sys.stdout.isatty()
+        ansi_open = "\x1b[1m" if use_ansi else ""
+        ansi_close = "\x1b[0m" if use_ansi else ""
+        html_open = "<b>"
+        html_close = "</b>"
+
+    # Group members by parent key so we can render the tree level by level.
+    nodes: dict[str, list[tuple[str, Any]]] = {}
+    for key, node in members:
+        # TODO: fix in `group_tree_async()` (zarr==3.1.6)
+        if key == "":
+            # avoid self-loop at root node
+            continue
+        elif key.count("/") == 0:
+            parent_key = ""
+        else:
+            parent_key = key.rsplit("/", 1)[0]
+        nodes.setdefault(parent_key, []).append((key, node))
+
+    # Render the tree iteratively (not recursively) to avoid hitting
+    # Python's recursion limit on deeply nested hierarchies.
+    # Each stack frame is (prefix_string, remaining_children_at_this_level).
+    text_lines = [f"{ansi_open}{group.name}{ansi_close}"]
+    html_lines = [f"{html_open}{html_escape(group.name)}{html_close}"]
+    stack = [("", deque(nodes.get("", [])))]
+    while stack:
+        prefix, remaining = stack[-1]
+        if not remaining:
+            stack.pop()
+            continue
+        key, node = remaining.popleft()
+        name = key.rsplit("/")[-1]
+        escaped_name = html_escape(name)
+        # if we popped the last item then remaining will
+        # now be empty - that's how we got past the if not remaining
+        # above, but this can still be true.
+        is_last = not remaining
+        connector = "└── " if is_last else "├── "
+        if isinstance(node, AsyncGroup):
+            text_lines.append(f"{prefix}{connector}{ansi_open}{name}{ansi_close}")
+            html_lines.append(f"{prefix}{connector}{html_open}{escaped_name}{html_close}")
+        else:
+            text_lines.append(
+                f"{prefix}{connector}{ansi_open}{name}{ansi_close} {node.shape} {node.dtype}"
+            )
+            html_lines.append(
+                f"{prefix}{connector}{html_open}{escaped_name}{html_close}"
+                f" {html_escape(str(node.shape))} {html_escape(str(node.dtype))}"
+            )
+        # Descend into children with an accumulated prefix:
+        # Example showing how prefix accumulates:
+        #   /
+        #   ├── a              prefix = ""
+        #   │   ├── b          prefix = "" + "│   "
+        #   │   │   └── x      prefix = "" + "│   " + "│   "
+        #   │   └── c          prefix = "" + "│   "
+        #   └── d              prefix = ""
+        #       └── e          prefix = "" + "    "
+        if children := nodes.get(key, []):
+            if is_last:
+                child_prefix = prefix + "    "
+            else:
+                child_prefix = prefix + "│   "
+            stack.append((child_prefix, deque(children)))
+    text = "\n".join(text_lines) + "\n"
+    html = "\n".join(html_lines) + "\n"
+    note = (
+        f"Truncated at max_nodes={max_nodes}, some nodes and their children may be missing\n"
+        if truncated
+        else ""
+    )
+    return TreeRepr(text, html, truncated=note)
+
+
+# ==============================================================================
+# array writer
+# ==============================================================================
+
+
+@final
+class AsyncZarrArrayWriter(AsyncArrayWriter[Array]):
+    """
+    Implementation of asynchronous write operations from in-memory Xarray data
+    structures to a Zarr store.
+    """
+
+    @property
+    def target_type(self) -> type[Array]:
+        return Array
+
+    def _sync(self, coro: Coroutine[None, None, None], /) -> None:
+        """
+        Run a coroutine on Zarr's event loop thread.
+        """
+        sync(coro)
+
+    async def _async(self) -> None:
+        """
+        Construct a coroutine using the :py:mod:`~zarr.api.asynchronous` Zarr
+        API.
+        """
+        # wait for all write operations to finish
+        await gather(*(
+            # access the async array API
+            t.async_array.setitem(r, s)
+            # iterate over write operations
+            for (s, t, r) in zip(self.sources, self.targets, self.regions)))
+
+
+# ==============================================================================
+# buffer writer
+# ==============================================================================
+
+
+@final
+class AsyncZarrBufferWriter(AsyncBufferWriter[ZarrStore]):
+    """
+    Session layer for writing :py:class:`.XarrayBuffer` contents to a persistent
+    Zarr store.
+
+    Within each simulation, the Zarr store handle is reused and data is
+    `appended`_ along the time dimension. After the simulation has finished,
+    `consolidated metadata`_ is either created or updated.
+
+    Example JSON configuration::
+
+      {
+        "format": 3,
+        "async.concurrency": 3,
+        "threading.max_workers": 3
+      }
+
+    Here,
+
+      - ``format`` is an explicit choice of the `Zarr format`_,
+      - and the other options are forwarded to the `Zarr concurrency
+        configuration`_.
+
+    .. hint::
+      The Zarr :py:mod:`~zarr.api.asynchronous` API is used for writing *data
+      variables* during a simulation, but the :py:mod:`~zarr.api.synchronous`
+      API is still used to write *metadata attributes* at the beginning and end
+      of the simulation. Once Xarray's ``async`` support has `matured`_, it
+      should be fully leveraged.
+
+    .. note::
+      Zarr is currently configured to use the Rust pipeline `zarrs-python`_ for
+      performance. However, the `numcodecs`_ compression used as a default in
+      :py:meth:`.var_codecs` is currently not supported by `zarrs-python`_, and
+      therefore, variables using such codecs will fall back to the
+      `zarr-python`_ implementation. These choices need to be revisited at a
+      later point, based on profiling of large-scale simulations.
+
+    .. _appended: https://docs.xarray.dev/en/stable/user-guide/io.html#modifying-existing-zarr-stores
+    .. _consolidated metadata: https://docs.xarray.dev/en/stable/user-guide/io.html#io-zarr-consolidated-metadata
+    .. _Zarr format: https://zarr.readthedocs.io/en/stable/user-guide/v3_migration/
+    .. _Zarr concurrency configuration: https://zarr.readthedocs.io/en/stable/user-guide/performance/#parallel-computing-and-synchronization
+    .. _matured: https://github.com/pydata/xarray/issues/10622
+    .. _zarrs-python: https://github.com/zarrs/zarrs-python
+    .. _numcodecs: https://numcodecs.readthedocs.io/en/stable/
+    .. _zarr-python: https://github.com/zarr-developers/zarr-python
+    """
+
+    @classmethod
+    def validate_config(cls, config: dict[str, Any], /) -> None:
+        super().validate_config(config)
+        zarr_config = config["backend_config"]
+        match zarr_config.get("format"):
+            case None:
+                raise KeyError(emitter_arg_error(
+                    cls, "Missing argument",
+                    "\"writer\": {\"backend_config\": {\"format\": ...}}"))
+            case 2 | 3:
+                pass
+            case fmt:
+                raise ValueError(emitter_arg_error(
+                    cls, "Invalid Zarr format",
+                    f"\"writer\": {{\"backend_config\": {{\"format\": {fmt}}}}}"))
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @property
+    def group(self) -> Group:
+        return self.store.zarr_group
+
+    def _open_group(self) -> Group:
+        """
+        Open Zarr API handles.
+
+        Called by: :py:meth:`._open_store`.
+
+        Calls: :py:func:`zarr.open_group`.
+        """
+        return zarr.open_group(
+            # URI for global store holding entire workflow
+            self.config["store"],
+            # independent substore holding current simulation subensemble
+            path=str(self.partition.independent_path),
+            # enforce explicit format choice
+            zarr_format=self.config["backend_config"]["format"],
+            # load consolidated metadata from previous generations
+            use_consolidated=True,
+            # only allow appending
+            mode="a",
+        )
+
+    def _check_group(self, group: Group) -> Group:
+        """
+        Perform basic consistency checks on the persistent storage state.
+
+        Called by: :py:meth:`._open_store`.
+        """
+        if self.partition.generation == 1:
+            if group.nmembers() > 0:
+                raise FileExistsError(
+                    f"({type(self).__name__})\n"
+                    f"  Path for new independent substore already exists:\n"
+                    f"    {group.store_path}")
+        else:
+            parent = self.partition.parent
+            time_coo = group.get(parent.time_coo_name)  # must survive `-O`
+            if time_coo is None:
+                raise FileNotFoundError(
+                    f"({type(self).__name__})\n"
+                    f"  Missing path from previous generation:\n"
+                    f"    {group.store_path / parent.time_coo_name}")
+            assert isinstance(time_coo, Array)
+            if not group.attrs.get(parent.success_attr_name, False):
+                raise ValueError(
+                    f"({type(self).__name__})\n"
+                    f"  Missing cell division event from previous generation:\n"
+                    f"    {parent.success_attr_name}")
+        return group
+
+    def _cache_consolidated_metadata(self, group: Group) -> Group:
+        """
+        Read consolidated metadata from persistent storage, and hide it from the
+        Zarr API, before it either interferes with, or is overwritten by, new
+        emits. The cached value is later used by :py:meth:`.consolidate`.
+
+        Called by: :py:meth:`._open_store`.
+        """
+        self.consolidated_metadata = group.metadata.consolidated_metadata
+        if self.partition.generation == 1:
+            assert self.consolidated_metadata is None
+        else:
+            assert self.consolidated_metadata is not None
+            async_group = _replace_consolidated_metadata(group._async_group, None)
+            group = replace(group, _async_group=async_group)
+        return group
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @property
+    def store_type(self) -> type[ZarrStore]:
+        return ZarrStore
+
+    def _open_store(self) -> ZarrStore:
+        """
+        Configure the Zarr transport layer and open Xarray API handles.
+
+        Called by: :py:meth:`.AsyncBufferWriter.open_store`.
+
+        Calls: :py:meth:`._open_group`, :py:meth:`._check_group`,
+        :py:meth:`._cache_consolidated_metadata`.
+        """
+        zarr_config = self.config["backend_config"]
+        zarr.config.update({
+            "async.concurrency": zarr_config.get(
+                "async.concurrency", ZARR_ASYNC_CONCURRENCY),
+            "threading.max_workers": zarr_config.get(
+                "threading.max_workers", ZARR_MAX_WORKERS),
+            # skip overhead of fill value checks
+            "array.write_empty_chunks": True,
+            "codec_pipeline": {
+                # use `zarrs-python`
+                "path": "zarrs.ZarrsCodecPipeline",
+                # limit array-level parallelism
+                "batch_size": 1,
+                # subordinate to `threading.max_workers`
+                "chunk_concurrent_minimum": 1,
+                "chunk_concurrent_maximum": None,
+                # prioritise robustness across formats and platforms
+                "validate_checksums": True,
+                "strict": False,
+                "direct_io": False,
+            }
+        })
+        return ZarrStore(
+            self._cache_consolidated_metadata(
+                self._check_group(self._open_group())),
+            # only allow appending along time axis
+            mode="a-",
+            # manage cache updates in `self.update_transport()`
+            cache_members=True,
+            # consolidate only after simulation finishes through Zarr API,
+            # rather than after every write through Xarray API
+            consolidate_on_close=False,
+            # finalise Zarr API
+            close_store_on_close=True,
+        )
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    def coo_codecs(self, var: VariableSpec, /) -> VariableEncoding:
+        """
+        Currently, no Zarr codecs are applied to coordinate arrays.
+        """
+        return {}
+
+    def var_codecs(self, var: VariableSpec, /) -> VariableEncoding:
+        """
+        Parse the Zarr codecs configured for a simulation variable; without
+        such a config, apply the default codecs using the variable's dtype.
+        """
+        z: int = self.group.metadata.zarr_format
+        if var.codecs:
+            # fetch variable-specific JSON config
+            _filters = var.codecs.get(f"filters_v{z}", [])
+            _compressors = var.codecs.get(f"compressors_v{z}", [])
+            if not (_filters or _compressors):
+                raise ValueError(emitter_arg_error(
+                    self, "Missing arguments",
+                    f"...: {{\"codecs\": "
+                    f"{{\"filters_v{z}\": ..., \"compressors_v{z}\": ...}}}}"))
+        else:
+            # derive per-variable filter configs from the defaults, building new
+            # dicts so that the module-level constants are never mutated
+            _compressors = ZARR_COMPRESSORS[z]
+            _filters = [
+                {**f, "dtype": var.dtype} if z == 2 else
+                {**f, "configuration": {
+                    **f["configuration"], "dtype": var.dtype}}
+                for f in ZARR_FILTERS[z]]
+        # parse codec config
+        filters: tuple[Codec | Numcodec, ...] | None
+        compressors: tuple[Codec | Numcodec | None, ...]
+        with filter_warnings(self._warnings_make_effect):
+            if z == 2:
+                filters = v2.parse_filters(_filters)
+                compressors = tuple(map(v2.parse_compressor, _compressors))
+            else:
+                filters = v3.parse_codecs(_filters)
+                compressors = v3.parse_codecs(_compressors)
+        return {"filters": filters, "compressors": compressors}
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @classmethod
+    def warnings_make_effect(cls) -> list[WarningFilter]:
+        return [
+            WarningFilter(
+                module="zarr.api.asynchronous",
+                category=ZarrUserWarning,
+                message="Consolidated metadata.*Zarr format 3",
+                action="ignore"),
+            WarningFilter(
+                module="zarr.core.dtype.npy.string",
+                category=UnstableSpecificationWarning,
+                message=".*data type.*Zarr V3",
+                action="ignore"),
+            WarningFilter(
+                module="zarr.codecs.numcodecs",
+                category=ZarrUserWarning,
+                message=".*Numcodecs codecs.*Zarr version 3",
+                action="ignore"),
+            WarningFilter(
+                module="zarrs.pipeline",
+                category=UserWarning,
+                message="Array is unsupported by ZarrsCodecPipeline",
+                action="ignore")]
+
+    @classmethod
+    def warnings_eval_effect(cls) -> list[WarningFilter]:
+        return [
+            WarningFilter(
+                module="zarrs.pipeline",
+                category=UserWarning,
+                message="Array is unsupported by ZarrsCodecPipeline",
+                action="ignore")]
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @staticmethod
+    def to_zarr_path(path: NodePath) -> str:
+        return "" if path == NodePath() else str(path)
+
+    def get_zarr_path(self, path: NodePath) -> Group:
+        assert isinstance(path, NodePath)
+        return (self.group if path == NodePath()
+                else cast(Group, self.group[self.to_zarr_path(path)]))
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    def merge_attributes(self, payload: DataTree) -> None:
+        """
+        Combine attributes from the existing Zarr store and the Xarray buffer
+        update at :py:attr:`.XarrayBuffer.modified_paths`.
+        """
+        for path in self.buffer.modified_paths:
+            # empty in-memory attribute containers do not produce write operations
+            if (xr_attrs := payload._get_item(path).attrs):
+                zr_attrs = dict(self.get_zarr_path(path).attrs)
+                payload._get_item(path).attrs = zr_attrs | xr_attrs
+
+    def make_effect(
+        self, payload: DataTree, encoding: Mapping[str, Any], /
+    ) -> AsyncZarrArrayWriter:
+        """
+        Calls: :py:func:`._datatree_to_zarr`.
+        """
+        return _datatree_to_zarr(payload, self.store, encoding)
+
+    def update_attributes(self, path: NodePath, attrs: dict[str, Any], /) -> None:
+        self.get_zarr_path(path).update_attributes(attrs)
+
+    def update_transport(self) -> None:
+        """
+        After writing the first buffer for a generation, emulate reinstantiating
+        the :py:class:`xarray.backends.ZarrStore` by updating its cache, and
+        enforce that subsequent writes can only append along the
+        generation-specific time axis.
+        """
+        assert self.group.metadata.consolidated_metadata is None
+        assert self.num_writes > 0
+        if self.num_writes == 1:
+            with filter_warnings(self._warnings_eval_effect):
+                # find direct children in the Zarr hierarchy
+                self.store._members = self.store._fetch_members()
+            # set appending axis
+            self.store._append_dim = self.partition.time_coo_name
+            assert self.store._append_dim in self.store.get_dimensions()
+        assert len(self.store.members)
+
+    def consolidate(self) -> None:
+        """
+        Create (first generation) or update (later generations) the
+        consolidated metadata in the Zarr store after a finished simulation.
+
+        Calls: :py:func:`.consolidate_metadata` or
+        :py:func:`.reconsolidate_metadata`.
+        """
+        assert self.group.metadata.consolidated_metadata is None
+        with filter_warnings(self._warnings_make_effect):
+            if self.partition.generation == 1:
+                # create from scratch, calling `Store.list_dir()` recursively
+                assert self.consolidated_metadata is None
+                sync(consolidate_metadata(self.group._async_group))
+            else:
+                # retrieve cached consolidated metadata from previous generations
+                assert self.consolidated_metadata is not None
+                async_group: AsyncGroup = _replace_consolidated_metadata(
+                    self.group._async_group, self.consolidated_metadata)
+                # combine with metadata for new paths
+                sync(reconsolidate_metadata(
+                    async_group,
+                    set(map(self.to_zarr_path, self.buffer.modified_paths)),
+                    set(map(self.to_zarr_path, self.buffer.added_paths))))
diff --git a/ecoli/processes/engine_process.py b/ecoli/processes/engine_process.py
index c7bea28da..d25c2d7e7 100644
--- a/ecoli/processes/engine_process.py
+++ b/ecoli/processes/engine_process.py
@@ -1,4 +1,4 @@
-"""
+r"""
 =============
 EngineProcess
 =============
@@ -93,10 +93,10 @@
 from vivarium.core.store import DEFAULT_SCHEMA, Store
 from vivarium.library.topology import get_in
 
-from ecoli.library.parquet_emitter import ParquetEmitter
 from ecoli.library.sim_data import RAND_MAX
 from ecoli.library.schema import remove_properties, empty_dict_divider, not_a_process
 from ecoli.library.updaters import inverse_updater_registry
+from ecoli.library.parquet_emitter import BufferedEmitter
 from ecoli.processes.cell_division import daughter_phylogeny_id
 
 
@@ -312,12 +312,13 @@ def __init__(self, parameters=None):
         # Only apply overrides to first cell in simulation
         self.parameters["inner_composer_config"].pop("initial_state_overrides", None)
 
+        # Only emit designated stores if specified
         if self.parameters["emit_paths"]:
-            self.sim.state.set_emit_values([tuple()], False)
-            self.sim.state.set_emit_values(
-                self.parameters["emit_paths"],
-                True,
-            )
+            if self.parameters["inner_emitter"] not in ("parquet", "xarray"):
+                state = self.sim.state
+                state.set_emit_value(emit=False, path=tuple())
+                state.set_emit_values(emit=True, paths=self.parameters["emit_paths"])
+
         self.random_state = np.random.RandomState(seed=self.parameters["seed"])
 
         self.updater_registry_reverse = {
@@ -340,6 +341,14 @@ def create_emitter(self):
         self.emitter_config["experiment_id"] = self.parameters["experiment_id"]
         self.emitter = get_emitter(self.emitter_config)
 
+        # Only emit designated stores if specified
+        if isinstance(self.emitter, BufferedEmitter):
+            assert self.parameters["inner_emitter"] in ("parquet", "xarray")
+            self.emitter.reset_emit_flags(
+                engine=self.sim,
+                agent=("agents", self.parameters["agent_id"]),
+                emit_paths=self.parameters["emit_paths"])
+
     def ports_schema(self):
         schema = {
             "agents": {},
@@ -510,7 +519,7 @@ def next_update(self, timestep, states):
             if force_complete:
                 self.sim.complete()
         except (Exception, KeyboardInterrupt):
-            if isinstance(self.emitter, ParquetEmitter):
+            if isinstance(self.emitter, BufferedEmitter):
                 self.emitter.finalize()
             raise
 
@@ -523,7 +532,7 @@ def next_update(self, timestep, states):
         ).get_value()
         if self.parameters["divide"] and division_variable >= division_threshold:
             # Finalize emits before division
-            if isinstance(self.emitter, ParquetEmitter):
+            if isinstance(self.emitter, BufferedEmitter):
                 self.emitter.success = True
                 self.emitter.finalize()
             # Perform division.
diff --git a/ecoli/processes/listeners/mass_listener.py b/ecoli/processes/listeners/mass_listener.py
index e23121c82..52d3d623d 100644
--- a/ecoli/processes/listeners/mass_listener.py
+++ b/ecoli/processes/listeners/mass_listener.py
@@ -121,7 +121,7 @@ def __init__(self, parameters=None):
         if self.compartment_abbrev_to_index:
             self._bulk_molecule_by_compartment = np.stack(
                 [
-                    np.core.defchararray.chararray.endswith(self.bulk_ids, abbrev + "]")
+                    np.char.endswith(self.bulk_ids, abbrev + "]")
                     for abbrev in self.compartment_abbrev_to_index
                 ]
             )
@@ -272,7 +272,7 @@ def next_update(self, timestep, states):
 
             massDiffs = np.array(list(attrs(molecules, self.massDiff_names))).T
             if self.match_wcecoli:
-                massDiffs = np.core.records.fromarrays(
+                massDiffs = np.rec.fromarrays(
                     attrs(molecules, self.massDiff_names)
                 ).view((np.float64, len(self.massDiff_names)))
             unique_submasses += massDiffs.sum(axis=0)
diff --git a/pyproject.toml b/pyproject.toml
index 26d279536..81559e902 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -34,6 +34,14 @@ dependencies = [
     "ortools<9.11",
     "pandas",
     "polars",
+    "xarray>=2026.04",
+    # concurrency control in `ecoli.library.xarray_emitter.zarr_writer`
+    # might require adjustments for `zarr>=3.2`:
+    # https://ossci.zulipchat.com/#narrow/channel/423692-Zarr/topic/3.2E2.2E0.20release
+    "zarr~=3.1.6",
+    "zarrs>=0.2",
+    # future consumers of `xarray_emitter`
+    # "cubed>=0.26",
     "pymunk",
     "scikit-image",
     "scikit-learn",
diff --git a/pytest.ini b/pytest.ini
index d2171d0ae..d954d1b4e 100644
--- a/pytest.ini
+++ b/pytest.ini
@@ -10,3 +10,9 @@ markers =
     slow: indicates slow tests (deselect with '-m "not slow"')
     noci: indicates tests that should not run on CI (e.g. because they are too slow)
     master: indicates tests that should only run on master
+    basic_workflow: selects a subset of 'MockEcoliSimWorkflow' tests for development
+tmp_path_retention_policy = failed
+tmp_path_retention_count = 1
+filterwarnings =
+    ignore::DeprecationWarning:multiprocessing.popen_fork
+    ignore::DeprecationWarning:vivarium.core.composition
diff --git a/runscripts/test_workflow.py b/runscripts/test_workflow.py
index 7e6bbb28a..741306e09 100644
--- a/runscripts/test_workflow.py
+++ b/runscripts/test_workflow.py
@@ -1,7 +1,9 @@
+
 """
-Tests for Nextflow workflow generation in workflow.py
+Tests for Nextflow workflow generation in :py:mod:`runscripts.workflow`, and a
+mock class for workflow execution that can be used by other test modules.
 
-These tests verify the correctness of:
+The tests verify the correctness of:
 - Channel grouping templates (MULTIDAUGHTER_CHANNEL, MULTIGENERATION_CHANNEL, etc.)
 - Analysis batching logic with group_size for cache invalidation
 - Full workflow generation via --build-only
@@ -17,21 +19,305 @@
 import shutil
 import subprocess
 import uuid
+import sys
+from dataclasses import dataclass, field
 from pathlib import Path
 from unittest.mock import patch
 
 import pytest
 
+from vivarium.core.store import Store
+from vivarium.core.engine import Engine
+
+from ecoli.library.test_utils import PatchConfig, patch_func, patch_meth
+from ecoli.library.emitter import StoragePartition
+from ecoli.processes.cell_division import DivisionDetected, daughter_phylogeny_id
+from ecoli.experiments.ecoli_master_sim import CONFIG_DIR_PATH, SimConfig, EcoliSim
+
 from runscripts.workflow import (
     generate_lineage,
     generate_code,
 )
 
-# Constants for test calculations
+
+# mypy: disable-error-code="attr-defined"
+
+
+# ==============================================================================
+# constants
+# ==============================================================================
+
+
 # The mock createVariants stub always produces 3 variants
 MOCK_NUM_VARIANTS = 3
 
 
+# ==============================================================================
+# mock workflow
+# ==============================================================================
+
+
+@dataclass(kw_only=True, slots=True)
+class MockEcoliSimWorkflow:
+    """
+    Mock class for emulating the orchestration of a single-variant, single-seed,
+    multi-generation, single-lineage simulation via the templated Nextflow
+    workflow, as triggered by :py:func:`runscripts.workflow.main`. Instead of
+    using Nextflow, this mock class runs on a single Python process inside a
+    temporary directory, and it incurs only a small fraction of the simulation
+    cost required for actually reaching cell division.
+
+    For documentation on the functionality being mocked, see :ref:`workflows`
+    and :ref:`experiment_output`.
+
+    The following CLI arguments for
+    :py:func:`ecoli.experiments.ecoli_master_sim.main` are handled explicitly,
+    via attributes and methods of this mock class:
+
+      - ``--config``
+      - ``--sim_data_path``
+      - ``--daughter_outdir``
+      - ``--initial_state_file``
+      - ``--agent_id``
+      - ``--initial_global_time``
+      - ``--lineage_seed``
+      - ``--seed``
+      - ``--emitter``
+      - ``--emitter_arg``
+
+    The following CLI arguments for
+    :py:func:`ecoli.experiments.ecoli_master_sim.main` are not represented in
+    this mock class:
+
+      - ``--variant``
+    """
+
+    #: Pytest fixture for modifying the execution environment.
+    monkeypatch: pytest.MonkeyPatch
+    #: Unique temporary working directory for this mock workflow.
+    workdir: Path
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    #: Stem of the baseline JSON configuration file.
+    config_name: str
+    #: - ``configs/test_configs/{config_name}.json``.
+    #: - Emulates the Nextflow input variable ``config_uri``.
+    #: - Passed to :py:class:`.EcoliSim` via the CLI argument ``--config``.
+    config_file: Path = field(init=False)
+    #: - Emulates the Nextflow input variable ``sim_data_uri``.
+    #: - Passed to :py:class:`.EcoliSim` via the CLI argument ``--sim_data_path``.
+    sim_data_path: Path
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    #: - Emulates the Nextflow local variable ``daughter_outdir``.
+    #: - Passed to :py:class:`.EcoliSim` via the CLI argument
+    #:   ``--daughter_outdir``.
+    daughter_outdir: Path
+    #: File inside :py:attr:`.daughter_outdir` that is exported by
+    #: :py:meth:`.EcoliSim.persist_generation`.
+    initial_state_name: str = "daughter_state_0.json"
+    #: - ``{daughter_outdir}/{initial_state_name}``.
+    #: - Emulates the Nextflow input variable ``initial_state_uri``.
+    #: - Passed back to :py:class:`.EcoliSim` via the CLI argument
+    #:   ``--initial_state_file``.
+    initial_state_file: Path = field(init=False)
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    #: - Emulates the Nextflow input variable ``agent_id``.
+    #: - Initialised in :py:func:`runscripts.workflow.generate_lineage`.
+    #: - Passed to :py:class:`.EcoliSim` via the CLI argument ``--agent_id``.
+    agent_id: str = '0'
+    #: - Emulates the Nextflow input variable ``generation``.
+    #: - Initialised in :py:func:`runscripts.workflow.generate_lineage`.
+    #: - Computed by :py:class:`.EcoliSim` as ``len(agent_id)`` in
+    #:   :py:class:`.StoragePartition`.
+    generation: int = 1
+    #: - Environment variable exported by :py:meth:`.EcoliSim.persist_generation`.
+    #: - Emulates the Nextflow input variable ``prev_division_time``.
+    #: - Passed back to :py:class:`.EcoliSim` via the CLI argument
+    #:   ``--initial_global_time``.
+    division_time: float = .0
+    #: - Emulates the Nextflow input variable ``lineage_seed``.
+    #: - Passed to :py:class:`.EcoliSim` via the CLI argument ``--lineage_seed``.
+    lineage_seed: int
+    #: - Emulates the Nextflow input variable ``sim_seed``.
+    #: - Passed to :py:class:`.EcoliSim` via the CLI argument ``--seed``.
+    sim_seed: int = field(init=False)
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    #: - Emitter configuration under test.
+    #: - Passed to :py:class:`.EcoliSim` via the CLI arguments
+    #:   ``--emitter`` and ``--emitter_arg``.
+    emitter_config: PatchConfig
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    #: Emulates the Nextflow process for a single generation.
+    sim: EcoliSim | None = None
+    #: Internal flag, unset at the generation that doesn't reach cell division.
+    prev_success: bool = True
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    def __post_init__(self) -> None:
+        """
+        Set the working directory, I/O file paths, and the initial seed.
+        """
+        # use a temporary working directory to contain workflow artefacts, e.g.,
+        # local files written by `ecoli.experiments.EcoliSim.persist_generation()`
+        self.monkeypatch.chdir(self.workdir)
+
+        # find a baseline JSON config
+        self.config_file = (
+            Path(CONFIG_DIR_PATH) / "test_configs" / f"{self.config_name}.json")
+        assert self.config_file.exists()
+
+        # find a `simData` in the repository
+        assert isinstance(self.sim_data_path, Path)
+        assert self.sim_data_path.is_absolute()
+        assert self.sim_data_path.exists()
+
+        # set the local path for daughter state
+        # - stored by: `ecoli.experiments.EcoliSim.persist_generation()`
+        # - loaded by: `ecoli.composites.ecoli_master.Ecoli.initial_state()`
+        assert isinstance(self.daughter_outdir, Path)
+        assert self.daughter_outdir.is_absolute()
+        self.daughter_outdir.mkdir(exist_ok=False)
+        self.initial_state_file = self.daughter_outdir / self.initial_state_name
+
+        # initialise the seed stream, emulating:
+        # `runscripts/nextflow/sim.nf::simGen0().script`
+        assert isinstance(self.lineage_seed, int)
+        self.sim_seed = self.lineage_seed
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    def init_sim(self, success: bool, /) -> EcoliSim:
+        """
+        Create a new simulator instance, in the emulated environment of a call
+        to :py:func:`ecoli.experiments.ecoli_master_sim.main` from the Nextflow
+        process of a new generation, and additionally apply
+        :py:attr:`.emitter_config` as well as the method patches required to
+        achieve the mock behaviour.
+
+        Called by: :py:meth:`.sim_gen`.
+
+        Args:
+            success: Flag for emulating a :py:exc:`.DivisionDetected` event.
+        """
+        # configure the baseline simulation
+        config = SimConfig()
+        config.update_from_json(str(self.config_file))
+        config.update_from_dict({
+            "sim_data_path": str(self.sim_data_path),
+            "daughter_outdir": str(self.daughter_outdir)})
+
+        # configure the generation state
+        config.update_from_dict({
+            "agent_id": self.agent_id,
+            "lineage_seed": self.lineage_seed,
+            "seed": self.sim_seed})
+        if self.generation > 1:
+            config.update_from_dict({
+                "initial_global_time": self.division_time,
+                "initial_state_file": str(self.initial_state_file)})
+
+        # configure the emitter parameters
+        config.update_from_dict(self.emitter_config.to_dict())
+
+        # construct the simulation state
+        sim = EcoliSim(config.to_dict())
+        with patch_func("ecoli.composites.ecoli_master.get_state_from_file") as f:
+            sim.build_ecoli()
+            if self.generation == 1:
+                f.assert_not_called()
+            else:
+                f.assert_called_once_with(path=str(self.initial_state_file))
+
+        # emulate the effects of reaching cell division
+        def update_experiment(_self: EcoliSim, _) -> None:
+            engine = _self.ecoli_experiment
+
+            # method called conditionally on exception `DivisionDetected`
+            def persist_generation(_: EcoliSim, *, num_agents: int = 2) -> tuple:
+                nonlocal self, engine
+                # emulate the environment variable `division_time`
+                self.division_time = engine.global_time
+                # mock agent division for single-daughter lineage
+                agents = engine.state.get_path(("agents",))
+                assert isinstance(agents, Store)
+                assert list(agents.inner.keys()) == [self.agent_id]
+                daughter_id = daughter_phylogeny_id(self.agent_id)[0]
+                daughter_state = agents.get_path((self.agent_id,))
+                agents.inner = {daughter_id: daughter_state}
+                # expect 1 agent in the wrapped method
+                assert num_agents == 2
+                return ((), {"num_agents": 1})
+            patch_meth(_self, "persist_generation", modargs=persist_generation)
+
+            # patch applied conditionally on test flag `success`
+            nonlocal success
+            if success:
+                # simulate until `config["max_duration"]` and then raise
+                def _check_complete(_: Engine):
+                    raise DivisionDetected
+                patch_meth(engine, "_check_complete", cb=_check_complete)
+        patch_meth(sim, "update_experiment", cb=update_experiment)
+        return sim
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    def sim_gen(self, success: bool, /) -> StoragePartition:
+        """
+        Emulate ``runscripts/nextflow/sim.nf::{simGen0,sim}()`` by starting a
+        single-generation simulation, stopping at ``config["max_duration"]``,
+        and storing the resulting cell state to disk, without waiting for an
+        actual cell division.
+
+        Calls: :py:meth:`.init_sim`.
+
+        Args:
+            success: Flag for emulating a :py:exc:`.DivisionDetected` event.
+        """
+        # sanity check the mock generation state
+        assert self.sim is None
+        assert self.prev_success
+        assert len(self.agent_id) == self.generation
+        assert self.sim_seed - self.lineage_seed == self.generation - 1
+
+        # emulate `ecoli_master_sim.main()`
+        self.sim = self.init_sim(success)
+        with self.monkeypatch.context() as mp:
+            # skip `sys.exit([status])` inside `EcoliSim.update_experiment()`
+            mp.setattr(sys, "exit", lambda *_args: None)
+            self.sim.run()
+
+        # sanity check the patching logic
+        u, p = self.sim.update_experiment, self.sim.persist_generation
+        u.assert_called_once_with(self.sim.max_duration)
+        p.assert_called_once_with() if success else p.assert_not_called()
+
+        # finalise the mock generation state
+        partition = self.sim.ecoli_experiment.emitter.partition
+        self.sim = None
+        self.prev_success = success
+
+        # emulate the generation transition in Nextflow variables
+        self.agent_id += "0"
+        self.generation += 1
+        self.sim_seed += 1
+        return partition
+
+
+# ==============================================================================
+# Nextflow tests
+# ==============================================================================
+
+
 class TestGenerateLineage:
     """Test the generate_lineage function output."""
 
@@ -197,6 +483,9 @@ def test_sims_per_seed_calculation_full_tree(self):
         assert "size: 7" in workflow_str
 
 
+# ------------------------------------------------------------------------------
+
+
 class TestGenerateCode:
     """Test the generate_code function."""
 
@@ -237,6 +526,9 @@ def test_without_sim_data_path_runs_parca(self):
         assert "runParca(params.config)" in run_parca
 
 
+# ------------------------------------------------------------------------------
+
+
 @pytest.fixture
 def temp_config_dir(tmp_path):
     """Create a temporary directory for test configs."""
@@ -780,6 +1072,9 @@ def test_stub_sim_data_path_skips_parca(self, temp_config_dir):
                 shutil.rmtree(out_dir)
 
 
+# ------------------------------------------------------------------------------
+
+
 class TestGroupSizeValues:
     """Test that group_size values are calculated correctly for different configurations."""
 
@@ -989,5 +1284,8 @@ def test_group_size_formulas(self, generations, n_init_sims, single_daughters):
             )
 
 
+# ------------------------------------------------------------------------------
+
+
 if __name__ == "__main__":
     pytest.main([__file__, "-v"])
diff --git a/uv.lock b/uv.lock
index 6d35fbc52..dcd0434a9 100644
--- a/uv.lock
+++ b/uv.lock
@@ -748,6 +748,18 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/8f/d7/9322c609343d929e75e7e5e6255e614fcc67572cfd083959cdef3b7aad79/docutils-0.21.2-py3-none-any.whl", hash = "sha256:dafca5b9e384f0e419294eb4d2ff9fa826435bf15f15b7bd45723e8ad76811b2", size = 587408, upload-time = "2024-04-23T18:57:14.835Z" },
 ]
 
+[[package]]
+name = "donfig"
+version = "0.8.1.post1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "pyyaml" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/25/71/80cc718ff6d7abfbabacb1f57aaa42e9c1552bfdd01e64ddd704e4a03638/donfig-0.8.1.post1.tar.gz", hash = "sha256:3bef3413a4c1c601b585e8d297256d0c1470ea012afa6e8461dc28bfb7c23f52", size = 19506, upload-time = "2024-05-23T14:14:31.513Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/0c/d5/c5db1ea3394c6e1732fb3286b3bd878b59507a8f77d32a2cebda7d7b7cd4/donfig-0.8.1.post1-py3-none-any.whl", hash = "sha256:2a3175ce74a06109ff9307d90a230f81215cbac9a751f4d1c6194644b8204f9d", size = 21592, upload-time = "2024-05-23T14:13:55.283Z" },
+]
+
 [[package]]
 name = "duckdb"
 version = "1.4.4"
@@ -2241,6 +2253,23 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/68/1d/ddb3e704c5a8fb90142bf9dc195c27db02a08a99f037395503bfbc1d14b3/numba-0.61.2-cp312-cp312-win_amd64.whl", hash = "sha256:97cf4f12c728cf77c9c1d7c23707e4d8fb4632b46275f8f3397de33e5877af18", size = 2831929, upload-time = "2025-04-09T02:57:58.45Z" },
 ]
 
+[[package]]
+name = "numcodecs"
+version = "0.16.5"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "numpy" },
+    { name = "typing-extensions" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/44/bd/8a391e7c356366224734efd24da929cc4796fff468bfb179fe1af6548535/numcodecs-0.16.5.tar.gz", hash = "sha256:0d0fb60852f84c0bd9543cc4d2ab9eefd37fc8efcc410acd4777e62a1d300318", size = 6276387, upload-time = "2025-11-21T02:49:48.986Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/75/cc/55420f3641a67f78392dc0bc5d02cb9eb0a9dcebf2848d1ac77253ca61fa/numcodecs-0.16.5-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:24e675dc8d1550cd976a99479b87d872cb142632c75cc402fea04c08c4898523", size = 1656287, upload-time = "2025-11-21T02:49:25.755Z" },
+    { url = "https://files.pythonhosted.org/packages/f5/6c/86644987505dcb90ba6d627d6989c27bafb0699f9fd00187e06d05ea8594/numcodecs-0.16.5-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:94ddfa4341d1a3ab99989d13b01b5134abb687d3dab2ead54b450aefe4ad5bd6", size = 1148899, upload-time = "2025-11-21T02:49:26.87Z" },
+    { url = "https://files.pythonhosted.org/packages/97/1e/98aaddf272552d9fef1f0296a9939d1487914a239e98678f6b20f8b0a5c8/numcodecs-0.16.5-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:b554ab9ecf69de7ca2b6b5e8bc696bd9747559cb4dd5127bd08d7a28bec59c3a", size = 8534814, upload-time = "2025-11-21T02:49:28.547Z" },
+    { url = "https://files.pythonhosted.org/packages/fb/53/78c98ef5c8b2b784453487f3e4d6c017b20747c58b470393e230c78d18e8/numcodecs-0.16.5-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:ad1a379a45bd3491deab8ae6548313946744f868c21d5340116977ea3be5b1d6", size = 9173471, upload-time = "2025-11-21T02:49:30.444Z" },
+    { url = "https://files.pythonhosted.org/packages/1c/20/2fdec87fc7f8cec950d2b0bea603c12dc9f05b4966dc5924ba5a36a61bf6/numcodecs-0.16.5-cp312-cp312-win_amd64.whl", hash = "sha256:845a9857886ffe4a3172ba1c537ae5bcc01e65068c31cf1fce1a844bd1da050f", size = 801412, upload-time = "2025-11-21T02:49:32.123Z" },
+]
+
 [[package]]
 name = "numpy"
 version = "2.2.6"
@@ -3850,7 +3879,10 @@ dependencies = [
     { name = "unum" },
     { name = "vivarium-core" },
     { name = "vl-convert-python" },
+    { name = "xarray" },
     { name = "xmltodict" },
+    { name = "zarr" },
+    { name = "zarrs" },
 ]
 
 [package.optional-dependencies]
@@ -3933,7 +3965,10 @@ requires-dist = [
     { name = "unum" },
     { name = "vivarium-core" },
     { name = "vl-convert-python" },
+    { name = "xarray", specifier = ">=2026.4" },
     { name = "xmltodict" },
+    { name = "zarr", specifier = "~=3.1.6" },
+    { name = "zarrs", specifier = ">=0.2" },
 ]
 provides-extras = ["dev", "docs"]
 
@@ -4067,16 +4102,16 @@ wheels = [
 
 [[package]]
 name = "xarray"
-version = "2025.12.0"
+version = "2026.4.0"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "numpy" },
     { name = "packaging" },
     { name = "pandas" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/d3/af/7b945f331ba8911fdfff2fdfa092763156119f124be1ba4144615c540222/xarray-2025.12.0.tar.gz", hash = "sha256:73f6a6fadccc69c4d45bdd70821a47c72de078a8a0313ff8b1e97cd54ac59fed", size = 3082244, upload-time = "2025-12-05T21:51:22.432Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/4b/a6/6fe936a798a3a38a79c7422d1a31afd2e9a14690fcb0ccff96bc01f04bf2/xarray-2026.4.0.tar.gz", hash = "sha256:c4ac9a01a945d90d5b1628e2af045099a9d4943536d4f2ee3ae963c3b222d15b", size = 3132311, upload-time = "2026-04-13T19:45:36.688Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/d5/e4/62a677feefde05b12a70a4fc9bdc8558010182a801fbcab68cb56c2b0986/xarray-2025.12.0-py3-none-any.whl", hash = "sha256:9e77e820474dbbe4c6c2954d0da6342aa484e33adaa96ab916b15a786181e970", size = 1381742, upload-time = "2025-12-05T21:51:20.841Z" },
+    { url = "https://files.pythonhosted.org/packages/dc/83/6d810a8a9ebc9c307989b418840c20e46907c74d707beb67ab566773e6fc/xarray-2026.4.0-py3-none-any.whl", hash = "sha256:d43751d9fb4a90f9249c30431684f00c41bc874f1edccd862631a40cbc0edf08", size = 1414326, upload-time = "2026-04-13T19:45:34.659Z" },
 ]
 
 [[package]]
@@ -4133,6 +4168,45 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/b4/2d/2345fce04cfd4bee161bf1e7d9cdc702e3e16109021035dbb24db654a622/yarl-1.20.1-py3-none-any.whl", hash = "sha256:83b8eb083fe4683c6115795d9fc1cfaf2cbbefb19b3a1cb68f6527460f483a77", size = 46542, upload-time = "2025-06-10T00:46:07.521Z" },
 ]
 
+[[package]]
+name = "zarr"
+version = "3.1.6"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "donfig" },
+    { name = "google-crc32c" },
+    { name = "numcodecs" },
+    { name = "numpy" },
+    { name = "packaging" },
+    { name = "typing-extensions" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/31/5a/b8a0cf39a14c770c30bd1f2d120c54000c8cd9e84e8e79f38d9a7ce58071/zarr-3.1.6.tar.gz", hash = "sha256:d95e72cbea4b90e9a70679468b8266400331756232576ae2b43400ac5108d0eb", size = 386531, upload-time = "2026-03-23T17:25:18.748Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/de/7c/ba8ca8cbe9dbef8e83a95fc208fed8e6686c98b4719aaa0aa7f3d31fe390/zarr-3.1.6-py3-none-any.whl", hash = "sha256:b5a82c5079d1c3d4ee8f06746fa3b9a98a7d804300fa3f4be154362a33e1207e", size = 295655, upload-time = "2026-03-23T17:25:17.189Z" },
+]
+
+[[package]]
+name = "zarrs"
+version = "0.2.3"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "numpy" },
+    { name = "zarr" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/f9/b3/9e088d4ab5c971e5d2b52cd4d58e3acce35acb3e131990fdc28b69366233/zarrs-0.2.3.tar.gz", hash = "sha256:61640dbbffb9a0b0ebd73f970ce97b52ef56df2828c2809058016d76da59ee60", size = 64827, upload-time = "2026-03-27T08:47:44.186Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/4a/c0/e10e618293351247e948527c0d2b4c3d8fa9f7478e9f8e945755fc47ecdc/zarrs-0.2.3-cp311-abi3-macosx_10_12_x86_64.whl", hash = "sha256:b9470b17629961badf4261fb0d26ad5fcbe316b63c1b00fb0489a51c3f8ef157", size = 6276814, upload-time = "2026-03-27T08:47:24.992Z" },
+    { url = "https://files.pythonhosted.org/packages/80/ad/8a8525a72190db2c8d6807c69695ef0ea959fd50a4ac887af80803ff5487/zarrs-0.2.3-cp311-abi3-macosx_11_0_arm64.whl", hash = "sha256:e6998bf1a61cd7c4afd3c263130317c1001599b37ff6f27082cc900a0ad48baa", size = 5776732, upload-time = "2026-03-27T08:47:26.685Z" },
+    { url = "https://files.pythonhosted.org/packages/56/63/27f9f7784006a900ffaa3d62d5c4d0dde98821683cd298cad79f66aa25c5/zarrs-0.2.3-cp311-abi3-manylinux_2_28_aarch64.whl", hash = "sha256:19b194f80139b838bb4bf18ed6ef93ecb1904717a04695fbc50cdc0c6074f282", size = 6139081, upload-time = "2026-03-27T08:47:28.465Z" },
+    { url = "https://files.pythonhosted.org/packages/59/a9/28b91493c7db9f3db191a1bc396cd2e212559536f2bc7325e5d5cdbb8b53/zarrs-0.2.3-cp311-abi3-manylinux_2_28_armv7l.whl", hash = "sha256:59a29dfdea088bb25c1e9b5107cbb8de15c8d571d51484ff128cd526c40521b9", size = 5966557, upload-time = "2026-03-27T08:47:30.064Z" },
+    { url = "https://files.pythonhosted.org/packages/3f/c1/0aba516796af22be08e82e37ded59f46cc7ffabf6932957455fccb9c6109/zarrs-0.2.3-cp311-abi3-manylinux_2_28_ppc64le.whl", hash = "sha256:1d387b75a19c31795cb2a81ef973c905c2c04ca3b1a4cca4bc84c81050974827", size = 6736692, upload-time = "2026-03-27T08:47:31.988Z" },
+    { url = "https://files.pythonhosted.org/packages/c5/fa/471e2511b0c77419ac2228ce72770e94e994ab99c6b9275cb3de1dcead2d/zarrs-0.2.3-cp311-abi3-manylinux_2_28_x86_64.whl", hash = "sha256:ab4074056f01f3292c89cd769e8c0db92c0df076e3d36665eec7fc557a62a2ed", size = 6467125, upload-time = "2026-03-27T08:47:34.107Z" },
+    { url = "https://files.pythonhosted.org/packages/a9/6a/7a4230676bd66c0181b4e9000bec30deee1b1695557e5d245514f0454103/zarrs-0.2.3-cp311-abi3-musllinux_1_2_aarch64.whl", hash = "sha256:9db202e95c3b5c9116afdfebf9912e1faa5ab60e6a1982e0406953cdb47bec38", size = 12507436, upload-time = "2026-03-27T08:47:36.138Z" },
+    { url = "https://files.pythonhosted.org/packages/e3/85/7ad323d428540ca7add343ade347841d181e4e3d73a69f39e34e447f0acc/zarrs-0.2.3-cp311-abi3-musllinux_1_2_armv7l.whl", hash = "sha256:991556a7589e93bc5445da2b97e0c89d7d871e539b9ef28dae857b8573c65f5c", size = 12209703, upload-time = "2026-03-27T08:47:38.619Z" },
+    { url = "https://files.pythonhosted.org/packages/6c/90/ca544236092ab4803d1c3c88ac7b143885e280a63954d454d60885784af8/zarrs-0.2.3-cp311-abi3-musllinux_1_2_x86_64.whl", hash = "sha256:437dd4fcf74607480361f401f15b47416aa69f0ff4379c4ea330c453b7e05098", size = 13044036, upload-time = "2026-03-27T08:47:40.589Z" },
+    { url = "https://files.pythonhosted.org/packages/7f/c1/be4e37d80a95347334c287cbb42d94c6181d447f1624c0c5354f593e1fda/zarrs-0.2.3-cp311-abi3-win_amd64.whl", hash = "sha256:72eb1f5c4ca8382cb9e38dd98a48a0e484170d703152110f32a39520c7fa570d", size = 5854312, upload-time = "2026-03-27T08:47:42.856Z" },
+]
+
 [[package]]
 name = "zipp"
 version = "3.23.0"

From 888a955fc2ce1fb86f326e2dd246ecc52dc94d48 Mon Sep 17 00:00:00 2001
From: ntfrgl <b.beronov@gmail.com>
Date: Mon, 11 May 2026 19:35:57 -0700
Subject: [PATCH 2/4] Implement PR feedback (1)

Fix Nextflow invocation with `XarrayEmitter`:
  - convert in `XarrayEmitter.__init__()`:
    `out_{dir,uri}` -> `writer.store`
  - add Nextflow invocation example for a multi-variant,
    multi-seed, multi-generation simulation workflow:
    `configs/test_configs/test_xarray_workflow.json`

Fix effect of cell division event on `XarrayEmitter`:
  - skip `XarrayBuffer.write()` when `len(data["agents"]) > 1`
  - adjust mocking of `EcoliSim.persist_generation()` in
    `MockEcoliSimWorkflow.init_sim()` to reduce CI runtime

Ancillary improvements:
  - fix `EmitPath.metadata_path()`
  - fix some minor refactoring leftovers
  - filter warnings in `AsyncZarrBufferWriter._open_store()`
    for `generation > 1`
  - add `XarrayTransducer.emitted_sim_tix` for more accurate
    `AsyncBufferWriter.log_effect()`
  - add `XarrayTransducer.buf_shifts` for more robust
    runtime assertions in `XarrayTransducer` and `VariableSpec`
---
 configs/test_configs/test_xarray_emitter.json |  14 ++-
 .../test_configs/test_xarray_workflow.json    |  47 ++++++++
 ecoli/experiments/ecoli_master_sim.py         |  34 +++---
 ecoli/library/parquet_emitter.py              |   5 +-
 ecoli/library/test_utils.py                   |   3 +-
 ecoli/library/xarray_emitter/__init__.py      |   8 +-
 ecoli/library/xarray_emitter/emit_path.py     |  15 +--
 .../library/xarray_emitter/emit_predicate.py  |   2 -
 ecoli/library/xarray_emitter/emitter.py       |  61 ++++++++--
 ecoli/library/xarray_emitter/storage.py       |   3 +-
 .../xarray_emitter/test_xarray_emitter.py     |  25 ++--
 ecoli/library/xarray_emitter/transducer.py    |  73 ++++++++----
 ecoli/library/xarray_emitter/view.py          |   6 +-
 ecoli/library/xarray_emitter/writer.py        |  86 ++++++++------
 ecoli/library/xarray_emitter/zarr_writer.py   | 112 +++++++++---------
 runscripts/test_workflow.py                   |  16 ++-
 runscripts/workflow.py                        |  33 ++----
 17 files changed, 336 insertions(+), 207 deletions(-)
 create mode 100644 configs/test_configs/test_xarray_workflow.json

diff --git a/configs/test_configs/test_xarray_emitter.json b/configs/test_configs/test_xarray_emitter.json
index 0c4532c71..95feffc53 100644
--- a/configs/test_configs/test_xarray_emitter.json
+++ b/configs/test_configs/test_xarray_emitter.json
@@ -9,6 +9,7 @@
   "log_updates": true,
   "emitter": "xarray",
   "emitter_arg": {
+    "out_dir": "out/tests",
     "debug": false,
     "transducer": {
       "predicate": [
@@ -22,7 +23,6 @@
       }
     },
     "writer": {
-      "store": "out/store",
       "threaded": true,
       "buffers_per_chunk": 2,
       "backend": "zarr",
@@ -73,6 +73,18 @@
           }]
         }
       },
+      {
+        "root": ["listeners"],
+        "variables": {
+          "fba_results": {
+            "reaction_fluxes": [{
+              "path": "metabolism/fluxes/internal/rxn_global_listener",
+              "unit": "[mmol/L.s]",
+              "dtype": "<f4"
+            }]
+          }
+        }
+      },
       {
         "root": ["log_update", "ecoli-metabolism", "listeners"],
         "variables": {
diff --git a/configs/test_configs/test_xarray_workflow.json b/configs/test_configs/test_xarray_workflow.json
new file mode 100644
index 000000000..db1e15ac1
--- /dev/null
+++ b/configs/test_configs/test_xarray_workflow.json
@@ -0,0 +1,47 @@
+{
+  "experiment_id": "test_xarray_workflow",
+  "sim_data_path": "out/kb/simData.cPickle",
+  "suffix_time": false,
+  "fail_at_max_duration": true,
+  "generations": 6,
+  "n_init_sims": 10,
+  "skip_baseline": false,
+  "variants": {
+    "condition": {"condition": {"value": ["with_aa", "acetate"]}
+    }
+  },
+  "emitter": "xarray",
+  "emitter_arg": {
+    "out_dir": "out/experiments",
+    "transducer": {
+      "predicate": [
+        [{"subsample": {"interval": 3}}]
+      ],
+      "buffer": {"size": 200}
+    },
+    "writer": {
+      "threaded": true,
+      "buffers_per_chunk": 1,
+      "backend": "zarr",
+      "backend_config": {
+        "format": 3,
+        "async.concurrency": 3,
+        "threading.max_workers": 3
+      }
+    },
+    "view": [
+      {
+        "root": ["listeners"],
+        "variables": {
+          "fba_results": {
+            "reaction_fluxes": [{
+              "path": "metabolic_fluxes",
+              "unit": "[mmol/L.s]",
+              "dtype": "<f4"
+            }]
+          }
+        }
+      }
+    ]
+  }
+}
diff --git a/ecoli/experiments/ecoli_master_sim.py b/ecoli/experiments/ecoli_master_sim.py
index efa2aca2e..ab95c92fb 100644
--- a/ecoli/experiments/ecoli_master_sim.py
+++ b/ecoli/experiments/ecoli_master_sim.py
@@ -778,7 +778,7 @@ def update_experiment(
                     # Exit so that `.run()` does not raise `TimeLimitError`.
                     sys.exit()
 
-    def persist_generation(self, *, num_agents: int = 2) -> None:
+    def persist_generation(self, *, mock: bool = False) -> None:
         """
         Upon reaching cell division, save the daughter cell states to JSON files
         in the directory specified by ``config['daughter_outdir']``. Also,
@@ -790,15 +790,18 @@ def persist_generation(self, *, num_agents: int = 2) -> None:
         Called by: :py:meth:`~.update_experiment`.
 
         Args:
-            num_agents: Expected number of cells. This argument exists solely
-                        for testing purposes.
+            mock: This argument exists solely for testing purposes, and has the
+                  effect of reducing costly file system operations.
         """
         state = self.ecoli_experiment.state.get_value(condition=not_a_process)
-        assert len(state["agents"]) == num_agents
+        assert len(state["agents"]) == 2
         # Daughter state should include all of the additional
         # non-agent state (e.g. environment state)
         non_agent_state = {k: v for k, v in state.items() if k != "agents"}
         for i, (agent_id, agent_state) in enumerate(state["agents"].items()):
+            if mock and i:
+                # skip export of second daughter state
+                continue
             prepare_save_state(agent_state)
             daughter_filename = f"daughter_state_{i}.json"
             daughter_path = cloud_path_join(self.daughter_outdir, daughter_filename)
@@ -813,10 +816,11 @@ def persist_generation(self, *, num_agents: int = 2) -> None:
             f"Divided at t = {self.ecoli_experiment.global_time} after "
             f"{self.ecoli_experiment.global_time - self.initial_global_time} sec."
         )
-        # Nextflow workflows will source division time to determine
-        # initial global time to use for daughter cells
-        with open("division_time.sh", "w") as f:
-            f.write(f"export division_time={self.ecoli_experiment.global_time}")
+        if not mock:
+            # Nextflow workflows will source division time to determine
+            # initial global time to use for daughter cells
+            with open("division_time.sh", "w") as f:
+                f.write(f"export division_time={self.ecoli_experiment.global_time}")
 
     def save_states(self) -> None:
         """
@@ -882,21 +886,11 @@ def run(self) -> None:
             if self.emitter_arg is not None:
                 for key, value in self.emitter_arg.items():
                     self.emitter_config[key] = value
-            if self.emitter == "parquet":
+            if self.emitter in ["parquet", "xarray"]:
                 if not any(map(self.emitter_config.__contains__,
                                ["out_dir", "out_uri"])):
                     raise KeyError(
-                        "Must provide out_dir or out_uri"
-                        " as emitter argument for parquet emitter.")
-            elif self.emitter == "xarray":
-                if not (
-                    not any(map(self.emitter_config.__contains__,
-                                ["out_dir", "out_uri"]))
-                    and "store" in self.emitter_config.get("writer", {})
-                ):
-                    raise KeyError(
-                        "For {\"emitter\": \"xarray\"}, please provide:\n"
-                        "  {\"emitter_arg\": {\"writer\": {\"store\": ... }}}")
+                        "Must provide `out_dir` or `out_uri` in `emitter_arg`.")
         else:
             raise TypeError(
                 "Emitter option must be a string"
diff --git a/ecoli/library/parquet_emitter.py b/ecoli/library/parquet_emitter.py
index 607ed3765..027091fdc 100644
--- a/ecoli/library/parquet_emitter.py
+++ b/ecoli/library/parquet_emitter.py
@@ -921,9 +921,8 @@ def reset_emit_flags(
         """
         assert engine.emitter is self
         if emit_paths:
-            state = self.ecoli_experiment.state
-            state.set_emit_value(emit=False, path=tuple())
-            state.set_emit_values(emit=True, paths=emit_paths)
+            engine.state.set_emit_value(emit=False, path=tuple())
+            engine.state.set_emit_values(emit=True, paths=emit_paths)
 
     def _finalize(self, *, success: bool):
         """
diff --git a/ecoli/library/test_utils.py b/ecoli/library/test_utils.py
index 1fbdd390e..e95ed85da 100644
--- a/ecoli/library/test_utils.py
+++ b/ecoli/library/test_utils.py
@@ -80,7 +80,8 @@ def side_effect(*args, **kwargs) -> Any:
 
 def patch_meth(
     obj: object, meth: str, *,
-    cb: Callable | None = None, modargs: Callable | None = None
+    cb: Callable[..., None] | None = None,
+    modargs: Callable[..., tuple[tuple, dict]] | None = None
 ) -> None:
     """
     Patch an object instance method, in order to trace its calls, and to
diff --git a/ecoli/library/xarray_emitter/__init__.py b/ecoli/library/xarray_emitter/__init__.py
index 6ccb43e76..693c76a02 100644
--- a/ecoli/library/xarray_emitter/__init__.py
+++ b/ecoli/library/xarray_emitter/__init__.py
@@ -76,8 +76,12 @@
 
 .. note::
   See :py:class:`.XarrayEmitter` for an explanation of the JSON configuration
-  syntax, and ``configs/test_configs/test_xarray_emitter.json`` for a complete
-  example.
+  syntax. For complete examples, see the following files in ``configs/test_configs/``:
+
+  - ``test_xarray_emitter.json`` (CLI invocation via
+    :py:func:`ecoli.experiments.ecoli_master_sim.main`)
+  - ``test_xarray_workflow.json`` (Nextflow invocation via
+    :py:func:`runscripts.workflow.main`).
 
 .. hint::
   As data structures, `DataTree`_\ s could support changes of variable names and
diff --git a/ecoli/library/xarray_emitter/emit_path.py b/ecoli/library/xarray_emitter/emit_path.py
index 7718d7b11..3879d3354 100644
--- a/ecoli/library/xarray_emitter/emit_path.py
+++ b/ecoli/library/xarray_emitter/emit_path.py
@@ -36,7 +36,7 @@ class EmitPathType(Flag):
     """
     listener = auto()
     """
-    Relative path to a ``("listener", ...)``
+    Relative path to a ``("listeners", ...)``
     :py:class:`~vivarium.core.store.Store` created by
     :py:func:`~ecoli.library.schema.listener_schema`.
     """
@@ -125,12 +125,13 @@ def metadata_path(self) -> HierarchyPath:
         """
         Corresponding path within the result of
         :py:meth:`ecoli.experiments.ecoli_master_sim.EcoliSim.output_metadata`.
+        Currently, this is either identical to :py:attr:`.path`, or is the
+        suffix of :py:attr:`.path` starting with ``"listeners"``.
         """
-        if not self.type.is_update_listener:
-            # access process metadata
-            return ()
-        elif EmitPathType.listener in self.type:
+        assert not self.type.is_agent
+        if self.type.is_listener:
             # access listener metadata
-            return ("listeners",)
+            return self.path[self.path.index("listeners"):]
         else:
-            raise NotImplementedError(f"Metadata access for:\n  {self}")
+            # access process metadata
+            return self.path
diff --git a/ecoli/library/xarray_emitter/emit_predicate.py b/ecoli/library/xarray_emitter/emit_predicate.py
index 560db392a..adf4fe2c9 100644
--- a/ecoli/library/xarray_emitter/emit_predicate.py
+++ b/ecoli/library/xarray_emitter/emit_predicate.py
@@ -101,7 +101,6 @@ def build(cls, config: list[dict[str, Any]]) -> Self:
                 cls, "Invalid argument", f"\"predicate\": [{config}]"))
         return cls(list(map(AtomicEmitPredicate.build, config)))
 
-    @abstractmethod
     def __call__(self, sim_tix: int, t: float, data: dict[str, Any], /) -> bool:
         """
         Evaluate the predicate for a simulation step.
@@ -145,7 +144,6 @@ def build(cls, config: list[list[dict[str, Any]]]) -> Self:
                 cls, "Invalid argument", f"\"predicate\": {config}"))
         return cls(list(map(DisjunctiveEmitPredicate.build, config)))
 
-    @abstractmethod
     def __call__(self, sim_tix: int, t: float, data: dict[str, Any], /) -> bool:
         """
         Evaluate the predicate for a simulation step.
diff --git a/ecoli/library/xarray_emitter/emitter.py b/ecoli/library/xarray_emitter/emitter.py
index 0f8f1c8a0..53c1a52c7 100644
--- a/ecoli/library/xarray_emitter/emitter.py
+++ b/ecoli/library/xarray_emitter/emitter.py
@@ -8,6 +8,7 @@
 
 from datetime import datetime
 from pathlib import Path
+from os.path import abspath, join
 from pprint import pp
 from typing import Any, final
 
@@ -44,6 +45,7 @@ class XarrayEmitter(BufferedEmitter):
       {
         "emitter": "xarray",
         "emitter_arg": {
+          "out_uri": "...",
           "transducer": {...},
           "view": [...],
           "writer": {...}
@@ -52,12 +54,20 @@ class XarrayEmitter(BufferedEmitter):
 
     Here,
 
+      - ``out_{dir,uri}``, after possibly having been modified by
+        :py:mod:`runscripts.workflow`, is converted into ``writer.store =
+        "{out_uri}/{experiment_id}/store"``,
       - ``transducer`` is parsed by :py:class:`.XarrayTransducer`,
       - ``view`` is parsed by :py:class:`.ForestView`,
       - and ``writer`` is parsed by :py:class:`.AsyncBufferWriter`.
 
-    For a complete example, see
-    ``configs/test_configs/test_xarray_emitter.json``.
+    .. note::
+      For complete examples, see the following files in ``configs/test_configs/``:
+
+      - ``test_xarray_emitter.json`` (CLI invocation via
+        :py:func:`ecoli.experiments.ecoli_master_sim.main`)
+      - ``test_xarray_workflow.json`` (Nextflow invocation via
+        :py:func:`runscripts.workflow.main`).
     """
 
     __slots__ = ("transducer", "writer", "finalized", "debug")
@@ -81,30 +91,57 @@ class XarrayEmitter(BufferedEmitter):
     """
 
     def __init__(self, config: dict[str, Any], /) -> None:
-        self.validate_config(config)
-        self.debug: bool = config.get("debug", False)
-        """ Flag for debug-level printing. Defaults to ``False``. """
-        self.transducer: XarrayTransducer = XarrayTransducer(config, debug=self.debug)
+        config = self.validate_config(config)
+        self.transducer: XarrayTransducer = XarrayTransducer(config)
         """ Presentation layer. """
         self.writer: AsyncBufferWriter = AsyncBufferWriter.dispatch(config["writer"])
         """ Session layer. """
+        self.debug: bool = config.get("debug", False)
+        """ Flag for debug-level printing. Defaults to ``False``. """
         super().__init__()
 
-    @classmethod
-    def validate_config(cls, config: dict[str, Any], /) -> None:
+    def validate_config(self, config: dict[str, Any], /) -> dict[str, Any]:
         """
-        Check assumptions about static emitter configuration.
+        Check assumptions about static emitter configuration, and convert
+        ``out_{dir,uri}`` into ``writer.store``.
         """
+        # emitter internals
         for key in ["transducer", "view", "writer"]:
             if key not in config:
                 raise KeyError(emitter_arg_error(
-                    cls, "Missing argument", f"\"{key}\": ..."))
+                    self, "Missing argument", f"\"{key}\": ..."))
         match config.get("debug", False):
             case bool():
                 pass
             case debug:
                 raise TypeError(emitter_arg_error(
-                    cls, "Invalid argument", f"\"debug\": {debug}"))
+                    self, "Invalid argument", f"\"debug\": {debug}"))
+
+        # output paths
+        match config.get("out_dir"):
+            case None:
+                match config.get("out_uri"):
+                    case None:
+                        raise KeyError(emitter_arg_error(
+                            self, "Missing store URI", "\"out_uri|out_dir\": ..."))
+                    case str(out):
+                        out_path = out
+                    case out:
+                        raise TypeError(emitter_arg_error(
+                            self, "Invalid output path", f"\"out_uri\": {out}"))
+            case (str() | Path()) as out:
+                out_path = abspath(out)
+            case out:
+                raise TypeError(emitter_arg_error(
+                    self, "Invalid output path", f"\"out_dir\": {out}"))
+        if not (experiment_id := config["experiment_id"]):
+            raise ValueError("Empty `experiment_id`")
+        if (store := config["writer"].get("store")) is not None:
+            raise KeyError(emitter_arg_error(
+                self, "Key should be written by `XarrayEmitter.validate_config()`",
+                f"\"writer\": {{\"store\": {store}}}"))
+        config["writer"]["store"] = join(out_path, experiment_id, "store")
+        return config
 
     # ~~~~~~~~~~~~~~~~~ #
 
@@ -216,7 +253,7 @@ def emit(self, data: dict[str, Any], /):
                     partition=self.extract_partition(metadata),
                     metadata=self.extract_metadata(metadata),
                     coords=self.extract_coords(metadata))
-                self.writer.open_store(self.transducer.buffer)
+                self.writer.open_store(self.transducer)
             # sender: `Engine._emit_store_data()`
             case "history":
                 if not self.transducer.step(payload):
diff --git a/ecoli/library/xarray_emitter/storage.py b/ecoli/library/xarray_emitter/storage.py
index c20c6447e..387067d76 100644
--- a/ecoli/library/xarray_emitter/storage.py
+++ b/ecoli/library/xarray_emitter/storage.py
@@ -283,7 +283,8 @@ def encoding(
                     # use 1 storage chunk for the coordinate array
                     "chunks": coo.shape} | writer.coo_codecs(self)}
             case (True, np.ndarray() as coo):
-                assert coo.shape == (buf_size,)
+                if writer.transducer.buf_shifts:
+                    assert coo.shape == (buf_size,)
                 coo_enc = {self.coo_name: {
                     # use 1 storage chunk for `b` buffers of the time coordinate
                     "chunks": (b * buf_size,)} | writer.coo_codecs(self)}
diff --git a/ecoli/library/xarray_emitter/test_xarray_emitter.py b/ecoli/library/xarray_emitter/test_xarray_emitter.py
index 2ac344815..0bc9c9fd7 100644
--- a/ecoli/library/xarray_emitter/test_xarray_emitter.py
+++ b/ecoli/library/xarray_emitter/test_xarray_emitter.py
@@ -51,6 +51,16 @@ def test_path_type(cls):
         with raises(AssertionError):
             EmitPath(("log_update", "baz", "log_update"))
 
+    @classmethod
+    def test_metadata_path(cls):
+        non_listener = ("foo", "bar")
+        assert EmitPath(non_listener).metadata_path == non_listener
+        listener = ("listeners", "foo", "bar", "7")
+        assert EmitPath(listener).metadata_path == listener
+        assert EmitPath(("log_update", "baz") + listener).metadata_path == listener
+        with raises(AssertionError):
+            EmitPath(("agents", "13")).metadata_path
+
 
 # ==============================================================================
 # integration tests
@@ -76,23 +86,22 @@ class XarrayEmitterConfig(PatchConfig):
     :py:class:`.PatchConfig` for the :py:class:`.XarrayEmitter`.
     """
 
-    store: Path
+    outdir: Path
     zarr_format: int
     threaded: bool
     debug: bool
     interval: int
 
     def __post_init__(self) -> None:
-        assert isinstance(self.store, Path)
-        assert self.store.is_absolute()
-        assert not self.store.exists()
+        assert isinstance(self.outdir, Path)
+        assert self.outdir.is_absolute()
 
     def to_dict(self) -> dict[str, Any]:
         return {
             "emitter": "xarray",
             "emitter_arg": {
+                "out_dir": str(self.outdir),
                 "writer": {
-                    "store": str(self.store),
                     "threaded": self.threaded,
                     "backend": "zarr",
                     "backend_config": {
@@ -184,8 +193,8 @@ def test_workflow(
         assert workdir.is_absolute()
         assert workdir.exists()
         assert not(list(workdir.iterdir()))
-        daughter_outdir = workdir / "daughter_states"
-        store = workdir / "store"
+        daughter_outdir = workdir / config_name / "daughter_states"
+        store = workdir / config_name / "store"
 
         # configure simulation workflow
         wf = MockEcoliSimWorkflow(
@@ -194,7 +203,7 @@ def test_workflow(
             daughter_outdir=daughter_outdir,
             lineage_seed=randint(0, 2**10 - 1),
             emitter_config=XarrayEmitterConfig(
-                store, zarr_format, threaded, debug, interval))
+                workdir, zarr_format, threaded, debug, interval))
 
         # step through workflow
         hline = "=" * 79
diff --git a/ecoli/library/xarray_emitter/transducer.py b/ecoli/library/xarray_emitter/transducer.py
index 14849ed29..2523b55f3 100644
--- a/ecoli/library/xarray_emitter/transducer.py
+++ b/ecoli/library/xarray_emitter/transducer.py
@@ -207,6 +207,11 @@ def write(
           sim_tix: :py:attr:`.XarrayTransducer.sim_tix`.
           t:       Simulation time stamp.
           data:    Input received from :py:meth:`!Engine._emit_store_data`.
+
+        .. note::
+          This method relies on the validity of :py:attr:`.partition` for the
+          current simulation, and hence assumes that it is *not* called after a
+          cell division event.
         """
         # index into buffer along time coordinate
         t_ix = {self.time_coo: buf_tix}
@@ -216,7 +221,9 @@ def write(
 
         # strip agent prefix and remove schema paths with empty emit values
         agent_path = ("agents", self.partition.agent_id)
-        emit_data = dict_to_paths((), get_in(data, agent_path))
+        emit_data = dict_to_paths((), get_in(data, agent_path, default=None))
+        if emit_data == [(), None]:
+            raise KeyError(f"Missing agent ID: {agent_path}")
 
         # check for expected emit paths
         emit_queue = set(self.view.emitted_paths)
@@ -402,10 +409,11 @@ class XarrayTransducer:
 
     __slots__ = (
         "__dict__", "predicate", "buffer",
-        "buf_size", "buf_tix", "sim_tix", "debug"
+        "buf_size", "buf_tix", "sim_tix", "emitted_sim_tix", "buf_shifts",
+        "debug"
     )
 
-    def __init__(self, config: dict[str, Any], /, *, debug: bool=False) -> None:
+    def __init__(self, config: dict[str, Any], /) -> None:
         self.validate_config(_config := config["transducer"])
 
         self.predicate = ConjunctiveEmitPredicate.build(_config["predicate"])
@@ -427,7 +435,17 @@ def __init__(self, config: dict[str, Any], /, *, debug: bool=False) -> None:
         Current absolute *simulation step*; advanced at the end of a
         :py:meth:`.step` call.
         """
-        self.debug: bool = debug
+        self.emitted_sim_tix: int = 0
+        """
+        Absolute *simulation step* of the latest *emit step*; updated by
+        :py:meth:`.step` whenever it writes into :py:attr:`.buffer`.
+        """
+        self.buf_shifts: int = 0
+        r"""
+        Number of cyclic buffer :py:meth:`.shift`\ s so far.
+        """
+
+        self.debug: bool = config.get("debug", False)
         """ Flag for debug-level printing. Defaults to ``False``. """
 
     @classmethod
@@ -454,8 +472,8 @@ def __str__(self) -> str:
     def display(self, buf: DataTree, /) -> str:
         return (
             f"{self.__class__.__name__}:\n"
-            f"  buf_size: {self.buf_size}\n"
-            f"  sim_tix: {self.sim_tix}, buf_tix: {self.buf_tix}\n"
+            f"  buf_size: {self.buf_size}, buf_tix: {self.buf_tix}\n"
+            f"  sim_tix: {self.sim_tix}, emitted_sim_tix: {self.emitted_sim_tix}\n"
             f"  buffer:{indent(4, buf)}")
 
     # ~~~~~~~~~~~~~~~~~ #
@@ -464,7 +482,10 @@ def check_buffer(self) -> None:
         """
         Basic consistency check, performed before each buffer-level operation.
         """
+        # index into a cyclic buffer
         assert 0 <= self.buf_tix <= self.buf_size
+        # emission lag depends on `self.predicate`
+        assert self.emitted_sim_tix <= self.sim_tix
         self.buffer.check_layout()
 
     def alloc(
@@ -488,9 +509,9 @@ def alloc(
 
     def step(self, data: dict[str, Any], /) -> bool:
         r"""
-        If :py:attr:`.predicate` is satisfied for the current *simulation step*,
-        then create a new *emit step* by writing the simulation data into
-        :py:attr:`.buffer`.
+        If :py:attr:`.predicate` is satisfied for the current *simulation step*
+        and a cell division event has *not* occurred yet, then create a new
+        *emit step* by writing the simulation data into :py:attr:`.buffer`.
 
         Called by: :py:meth:`.XarrayEmitter.emit`.
 
@@ -498,21 +519,24 @@ def step(self, data: dict[str, Any], /) -> bool:
         :py:meth:`.XarrayBuffer.write`.
 
         Args:
-          data: Payload from :py:meth:`.XarrayEmitter.emit`.
+          data: Input received from :py:meth:`!Engine._emit_store_data`.
 
         Returns:
-          `False` if the buffer is full and the operation cannot be performed
-          without first :py:meth:`.flush`\ ing, otherwise `True`.
-        """
-        if self.predicate(self.sim_tix, t := get_in(data, ("time",)), data):
-            if self.buf_tix < self.buf_size:
-                # fill current emit step
-                self.buffer.write(self.buf_tix, self.sim_tix, t, data)
-                # increment emit step
-                self.buf_tix += 1
-            else:
-                # writing now would result in an `IndexError`
-                return False
+          ``False`` if the buffer is full and the operation cannot be performed
+          without first :py:meth:`.flush`\ ing, otherwise ``True``.
+        """
+        if len(data["agents"]) == 1:
+            if self.predicate(self.sim_tix, t := data["time"], data):
+                if self.buf_tix < self.buf_size:
+                    # fill current emit step
+                    self.buffer.write(self.buf_tix, self.sim_tix, t, data)
+                    # increment emit step
+                    self.buf_tix += 1
+                    # record latest emitted simulation step
+                    self.emitted_sim_tix = self.sim_tix
+                else:
+                    # writing now would result in an `IndexError`
+                    return False
         # increment simulation step
         self.sim_tix += 1
         return True
@@ -544,7 +568,7 @@ def flush(
         """
         self.check_buffer()
         if final:
-            assert not include_static
+            assert not (self.buf_shifts and include_static)
             if self.buf_tix < self.buf_size:
                 # at least one unfilled emit step inside allocated buffer
                 self.truncate()
@@ -554,7 +578,7 @@ def flush(
             writer, self.buf_size,
             include_static=include_static, copy=not final)
         writer.merge_attributes(buf)
-        ref = {"sim_step": self.sim_tix,
+        ref = {"sim_step": self.emitted_sim_tix,
                "sim_time": self.buffer.get_time(self.buf_tix - 1)}
         if final:
             # reference to buffer components no longer needed
@@ -575,6 +599,7 @@ def shift(self) -> None:
         self.check_buffer()
         assert self.buf_tix == self.buf_size
         self.buf_tix = 0
+        self.buf_shifts += 1
         self.buffer.shift(self.buf_size)
 
     def truncate(self) -> None:
diff --git a/ecoli/library/xarray_emitter/view.py b/ecoli/library/xarray_emitter/view.py
index e25eaff9b..806a5e1e9 100644
--- a/ecoli/library/xarray_emitter/view.py
+++ b/ecoli/library/xarray_emitter/view.py
@@ -339,10 +339,10 @@ def __post_init__(self) -> None:
         if not len(self.forest):
             raise ValueError(emitter_arg_error(
                 self, "Missing arguments", "\"view\": [...]"))
-        paths = list(chain.from_iterable(t.paths for t in self.forest))
-        if len(frozenset(paths)) != len(paths):
+        roots = [t.root.path for t in self.forest]
+        if len(frozenset(roots)) != len(roots):
             raise ValueError(emitter_arg_error(
-                self, "Duplicate paths", "\"view\": [...]"))
+                self, "Duplicate roots", "\"view\": [...]"))
 
     @classmethod
     def from_dict(cls, config: list[dict[str, Any]], /) -> Self:
diff --git a/ecoli/library/xarray_emitter/writer.py b/ecoli/library/xarray_emitter/writer.py
index 935ed5195..a5cb8f52a 100644
--- a/ecoli/library/xarray_emitter/writer.py
+++ b/ecoli/library/xarray_emitter/writer.py
@@ -14,7 +14,6 @@
 from concurrent.futures import Future, Executor, ThreadPoolExecutor
 from functools import cached_property
 from inspect import ismethod
-from pathlib import Path
 from typing import Any
 from weakref import finalize
 
@@ -124,16 +123,18 @@ class AsyncBufferWriter[StoreT](ABC):
     Example JSON configuration::
 
       {
-        "store": "out/store",
+        "store": "{out_uri}/{experiment_id}/store",
         "threaded": true,
-        "buffers_per_chunk": 10,
+        "buffers_per_chunk": 1,
         "backend": "zarr",
         "backend_config": {...}
       }
 
     Here,
 
-      - ``store`` is a URI interpreted by the backend,
+      - ``store`` is a URI interpreted by the backend, and is currently set by
+        :py:meth:`.XarrayEmitter.validate_config` based on
+        ``emitter_arg.out_{dir,uri}``,
       - ``threaded`` toggles the use of a separate writer thread,
       - ``buffers_per_chunk`` is the integer-valued size ratio, in terms of
         *emit step* counts, between one chunk of backend storage and one
@@ -143,18 +144,22 @@ class AsyncBufferWriter[StoreT](ABC):
       - and ``backend_config`` is interpreted by the backend subclass.
 
     .. note::
-      The parameter ``buffers_per_chunk`` is intended to decouple the number of
-      output files from the choice of ``transducer.buffer.size`` in
-      :py:class:`.XarrayTransducer`. As a rule of thumb, 1 chunk file per
-      variable per generation is desirable in order to minimize the file system
-      pressure, unless a downstream application can benefit from smaller file
-      sizes.
-
-      The latter situation appears to be unlikely under current simulation use
-      cases. However, it may be supported in the future by extending the writer
-      configuration to further distinguish between *chunks* and *shards*, which
-      is `supported`_ by backends like Zarr.
-
+      The parameter ``writer.buffers_per_chunk`` is intended to decouple the
+      number of output files from the choice of ``transducer.buffer.size`` in
+      :py:class:`.XarrayTransducer`. As a rule of thumb:
+
+      -  For **immutable** object storage systems (e.g., Amazon S3 Standard
+         storage class), ``buffers_per_chunk`` must be set to 1, in order to
+         avoid copying previous objects when appending to them.
+      -  For local or HPC file systems, as well as for **appendable** object
+         storage systems (e.g., `Amazon S3 Express One Zone`_ storage class), 1
+         chunk file per variable per generation is desirable in order to
+         minimize the file system pressure. In case future downstream
+         applications require smaller chunk sizes, the writer configuration may
+         be extended to further distinguish between *chunks* and *shards*, which
+         is `supported`_ by backends like Zarr.
+
+    .. _Amazon S3 Express One Zone: https://docs.aws.amazon.com/AmazonS3/latest/userguide/directory-buckets-objects-append.html
     .. _supported: https://zarr.readthedocs.io/en/latest/user-guide/performance/#sharding
     """
 
@@ -178,10 +183,11 @@ def dispatch(cls, config: dict[str, Any], /) -> AsyncBufferWriter:
 
     def __init__(self, config: dict[str, Any], /) -> None:
         self.validate_config(config)
+        self.validate_backend_config(config["backend_config"])
         self.config: dict[str, Any] = config
         """ Static configuration, received via :py:meth:`!Emitter.__init__`. """
 
-        self._buffer: XarrayBuffer | None = None
+        self._transducer: XarrayTransducer | None = None
         self._store: StoreT | None = None
         self._store_finalizer: Callable[[], None] | None = None
         """ Finalizer for :py:attr:`.store`. """
@@ -198,15 +204,8 @@ def __init__(self, config: dict[str, Any], /) -> None:
     @classmethod
     def validate_config(cls, config: dict[str, Any], /) -> None:
         """
-        Check assumptions about static writer configuration.
+        Check assumptions about backend-agnostic writer configuration.
         """
-        match config["store"]:
-            case (str() | Path()) as store if not str(store).endswith("/"):
-                pass
-            case store:
-                raise TypeError(emitter_arg_error(
-                    cls, "Invalid store path",
-                    f"\"writer\": {{\"store\": \"{store}\"}}"))
         match config.get("buffers_per_chunk"):
             case None:
                 raise KeyError(emitter_arg_error(
@@ -230,21 +229,36 @@ def validate_config(cls, config: dict[str, Any], /) -> None:
                     cls, "Invalid argument",
                     f"\"writer\": {{\"backend_config\": {c}}}"))
 
+    @classmethod
+    @abstractmethod
+    def validate_backend_config(cls, config: dict[str, Any], /) -> None:
+        """
+        Check assumptions about backend-specific writer configuration.
+        """
+        ...
+
     # ~~~~~~~~~~~~~~~~~ #
 
     @property
-    def buffer(self) -> XarrayBuffer:
+    def transducer(self) -> XarrayTransducer:
         """
         Dynamic configuration, received via :py:meth:`!Engine._emit_configuration`.
         """
-        assert self._buffer is not None
-        return self._buffer
+        assert self._transducer is not None
+        return self._transducer
+
+    @transducer.setter
+    def transducer(self, transducer: XarrayTransducer) -> None:
+        assert self._transducer is None
+        assert isinstance(transducer, XarrayTransducer)
+        self._transducer = transducer
 
-    @buffer.setter
-    def buffer(self, buffer: XarrayBuffer) -> None:
-        assert self._buffer is None
-        assert isinstance(buffer, XarrayBuffer)
-        self._buffer = buffer
+    @property
+    def buffer(self) -> XarrayBuffer:
+        """
+        Buffer held by :py:attr:`.transducer`.
+        """
+        return self.transducer.buffer
 
     @property
     def partition(self) -> XarrayStoragePartition:
@@ -263,7 +277,7 @@ def store_type(self) -> type[StoreT]:
         """
         ...
 
-    def open_store(self, buffer: XarrayBuffer, /) -> None:
+    def open_store(self, transducer: XarrayTransducer, /) -> None:
         """
         Initialise the transport layer.
 
@@ -273,7 +287,7 @@ def open_store(self, buffer: XarrayBuffer, /) -> None:
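-          buffer: Used for obtaining dynamic metadata that is received through
-                  :py:meth:`!Engine._emit_configuration`.
+          transducer: Used for obtaining dynamic metadata that is received
+                      through :py:meth:`!Engine._emit_configuration`.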
         """
-        self.buffer = buffer
+        self.transducer = transducer
         self.store = self._open_store()
 
     @abstractmethod
@@ -361,7 +375,7 @@ def warnings_eval_effect(cls) -> list[WarningFilter]:
 
     @cached_property
     def _warnings_eval_effect(self) -> list[WarningFilter]:
-        return self.warnings_make_effect()
+        return self.warnings_eval_effect()
 
     @classmethod
     def warnings_all(cls) -> list[WarningFilter]:
diff --git a/ecoli/library/xarray_emitter/zarr_writer.py b/ecoli/library/xarray_emitter/zarr_writer.py
index e5c9b0c54..e39f43f29 100644
--- a/ecoli/library/xarray_emitter/zarr_writer.py
+++ b/ecoli/library/xarray_emitter/zarr_writer.py
@@ -505,10 +505,8 @@ class AsyncZarrBufferWriter(AsyncBufferWriter[ZarrStore]):
     """
 
     @classmethod
-    def validate_config(cls, config: dict[str, Any], /) -> None:
-        super().validate_config(config)
-        zarr_config = config["backend_config"]
-        match zarr_config.get("format"):
+    def validate_backend_config(cls, config: dict[str, Any], /) -> None:
+        match config.get("format"):
             case None:
                 raise KeyError(emitter_arg_error(
                     cls, "Missing argument",
@@ -534,18 +532,19 @@ def _open_group(self) -> Group:
 
         Calls: :py:func:`zarr.open_group`.
         """
-        return zarr.open_group(
-            # URI for global store holding entire workflow
-            self.config["store"],
-            # independent substore holding current simulation subensemble
-            path=str(self.partition.independent_path),
-            # enforce explicit format choice
-            zarr_format=self.config["backend_config"]["format"],
-            # load consolidated metadata from previous generations
-            use_consolidated=True,
-            # only allow appending
-            mode="a",
-        )
+        with filter_warnings(self._warnings_eval_effect):
+            return zarr.open_group(
+                # URI for global store holding entire workflow
+                self.config["store"],
+                # independent substore holding current simulation subensemble
+                path=str(self.partition.independent_path),
+                # enforce explicit format choice
+                zarr_format=self.config["backend_config"]["format"],
+                # load consolidated metadata from previous generations
+                use_consolidated=True,
+                # only allow appending
+                mode="a",
+            )
 
     def _check_group(self, group: Group) -> Group:
         """
@@ -629,19 +628,22 @@ def _open_store(self) -> ZarrStore:
                 "direct_io": False,
             }
         })
-        return ZarrStore(
-            self._cache_consolidated_metadata(
-                self._check_group(self._open_group())),
-            # only allow appending along time axis
-            mode="a-",
-            # manage cache updates in `self.update_transport()`
-            cache_members=True,
-            # consolidate only after simulation finishes through Zarr API,
-            # rather than after every write through Xarray API
-            consolidate_on_close=False,
-            # finalise Zarr API
-            close_store_on_close=True,
-        )
+        group = self._cache_consolidated_metadata(
+            self._check_group(
+                self._open_group()))
+        with filter_warnings(self._warnings_eval_effect):
+            return ZarrStore(
+                group,
+                # only allow appending along time axis
+                mode="a-",
+                # manage cache updates in `self.update_transport()`
+                cache_members=True,
+                # consolidate only after simulation finishes through Zarr API,
+                # rather than after every write through Xarray API
+                consolidate_on_close=False,
+                # finalise Zarr API
+                close_store_on_close=True,
+            )
 
     # ~~~~~~~~~~~~~~~~~ #
 
@@ -689,38 +691,36 @@ def var_codecs(self, var: VariableSpec, /) -> VariableEncoding:
 
     # ~~~~~~~~~~~~~~~~~ #
 
+    _zarr_warnings: dict[str, WarningFilter] = {
+        "consolidated_metadata": WarningFilter(
+            module="zarr.api.asynchronous",
+            category=ZarrUserWarning,
+            message="Consolidated metadata.*Zarr format 3",
+            action="ignore"),
+        "string": WarningFilter(
+            module="zarr.core.dtype.npy.string",
+            category=UnstableSpecificationWarning,
+            message=".*data type.*Zarr V3",
+            action="ignore"),
+        "numcodecs": WarningFilter(
+            module="zarr.codecs.numcodecs",
+            category=ZarrUserWarning,
+            message=".*Numcodecs codecs.*Zarr version 3 specification",
+            action="ignore"),
+        "zarrs": WarningFilter(
+            module="zarrs.pipeline",
+            category=UserWarning,
+            message="Array is unsupported by ZarrsCodecPipeline",
+            action="ignore")
+    }
+
     @classmethod
     def warnings_make_effect(cls) -> list[WarningFilter]:
-        return [
-            WarningFilter(
-                module="zarr.api.asynchronous",
-                category=ZarrUserWarning,
-                message="Consolidated metadata.*Zarr format 3",
-                action="ignore"),
-            WarningFilter(
-                module="zarr.core.dtype.npy.string",
-                category=UnstableSpecificationWarning,
-                message=".*data type.*Zarr V3",
-                action="ignore"),
-            WarningFilter(
-                module="zarr.codecs.numcodecs",
-                category=ZarrUserWarning,
-                message=".*Numcodecs codecs.*Zarr version 3",
-                action="ignore"),
-            WarningFilter(
-                module="zarrs.pipeline",
-                category=UserWarning,
-                message="Array is unsupported by ZarrsCodecPipeline",
-                action="ignore")]
+        return list(cls._zarr_warnings.values())
 
     @classmethod
     def warnings_eval_effect(cls) -> list[WarningFilter]:
-        return [
-            WarningFilter(
-                module="zarrs.pipeline",
-                category=UserWarning,
-                message="Array is unsupported by ZarrsCodecPipeline",
-                action="ignore")]
+        return [cls._zarr_warnings[w] for w in ["numcodecs", "zarrs"]]
 
     # ~~~~~~~~~~~~~~~~~ #
 
diff --git a/runscripts/test_workflow.py b/runscripts/test_workflow.py
index 741306e09..e54676fa5 100644
--- a/runscripts/test_workflow.py
+++ b/runscripts/test_workflow.py
@@ -186,7 +186,7 @@ def __post_init__(self) -> None:
         # - loaded by: `ecoli.composites.ecoli_master.Ecoli.initial_state()`
         assert isinstance(self.daughter_outdir, Path)
         assert self.daughter_outdir.is_absolute()
-        self.daughter_outdir.mkdir(exist_ok=False)
+        self.daughter_outdir.mkdir(parents=True, exist_ok=True)
         self.initial_state_file = self.daughter_outdir / self.initial_state_name
 
         # initialise the seed stream, emulating:
@@ -243,7 +243,7 @@ def update_experiment(_self: EcoliSim, _) -> None:
             engine = _self.ecoli_experiment
 
             # method called conditionally on exception `DivisionDetected`
-            def persist_generation(_: EcoliSim, *, num_agents: int = 2) -> tuple:
+            def persist_generation(_: EcoliSim) -> tuple[tuple, dict]:
                 nonlocal self, engine
                 # emulate the environment variable `division_time`
                 self.division_time = engine.global_time
@@ -251,12 +251,10 @@ def persist_generation(_: EcoliSim, *, num_agents: int = 2) -> tuple:
                 agents = engine.state.get_path(("agents",))
                 assert isinstance(agents, Store)
                 assert list(agents.inner.keys()) == [self.agent_id]
-                daughter_id = daughter_phylogeny_id(self.agent_id)[0]
                 daughter_state = agents.get_path((self.agent_id,))
-                agents.inner = {daughter_id: daughter_state}
-                # expect 1 agent in the wrapped method
-                assert num_agents == 2
-                return ((), {"num_agents": 1})
+                agents.inner = {i: daughter_state
+                                for i in daughter_phylogeny_id(self.agent_id)}
+                return ((), {"mock": True})
             patch_meth(_self, "persist_generation", modargs=persist_generation)
 
             # patch applied conditionally on test flag `success`
@@ -275,8 +273,8 @@ def sim_gen(self, success: bool, /) -> StoragePartition:
         """
         Emulate ``runscripts/nextflow/sim.nf::{simGen0,sim}()`` by starting a
         single-generation simulation, stopping at ``config["max_duration"]``,
-        and storing the resulting cell state to disk, without waiting for an
-        actual cell division.
+        and storing the resulting single cell state to disk, without waiting for
+        an actual cell division.
 
         Calls: :py:meth:`.init_sim`.
 
diff --git a/runscripts/workflow.py b/runscripts/workflow.py
index d661ef1f8..28d5b85a6 100644
--- a/runscripts/workflow.py
+++ b/runscripts/workflow.py
@@ -534,11 +534,11 @@ def strip_resource_keys(config: dict) -> dict:
     return stripped
 
 
-CONFIG_DIR_PATH = os.path.join(
-    os.path.dirname(os.path.dirname(os.path.abspath(__file__))),
-    "configs",
-)
-NEXTFLOW_DIR = os.path.join(os.path.dirname(os.path.abspath(__file__)), "nextflow")
+RUNSCRIPTS_DIR = os.path.dirname(os.path.abspath(__file__))
+REPO_DIR = os.path.dirname(RUNSCRIPTS_DIR)
+CONFIG_DIR_PATH = os.path.join(REPO_DIR, "configs")
+NEXTFLOW_DIR = os.path.join(RUNSCRIPTS_DIR, "nextflow")
+CONTAINER_DIR = os.path.join(RUNSCRIPTS_DIR, "container")
 
 # These input channels calculate the values that the analysis jobs defined in
 # runscripts/nextflow/analysis.nf consume.
@@ -1012,9 +1012,7 @@ def get_cluster_config(
 
 
 def build_image_cmd(image_name, apptainer=False) -> list[str]:
-    build_script = os.path.join(
-        os.path.dirname(__file__), "container", "build-image.sh"
-    )
+    build_script = os.path.join(CONTAINER_DIR, "build-image.sh")
     cmd = [build_script, "-i", image_name]
     if apptainer:
         cmd.append("-a")
@@ -1075,9 +1073,7 @@ def run_ecr_script(image: str, build: bool, region: str = "us-gov-west-1") -> st
     Returns:
         Full ECR image URI.
     """
-    build_script = os.path.join(
-        os.path.dirname(__file__), "container", "build-and-push-ecr.sh"
-    )
+    build_script = os.path.join(CONTAINER_DIR, "build-and-push-ecr.sh")
 
     # Parse the container_image to extract repo name and tag
     # Expected format: <account>.dkr.ecr.<region>.amazonaws.com/<repo>:<tag>
@@ -1350,11 +1346,7 @@ def main():
     # Load .env from the repository root so that variables like NXF_VER are
     # set even when the script is invoked directly with python (e.g. on HPC/
     # cloud) rather than via ``uv run --env-file .env``.
-    _load_dotenv(
-        os.path.join(
-            os.path.dirname(os.path.dirname(os.path.abspath(__file__))), ".env"
-        )
-    )
+    _load_dotenv(os.path.join(REPO_DIR, ".env"))
     parser = argparse.ArgumentParser()
     config_file = os.path.join(CONFIG_DIR_PATH, "default.json")
     parser.add_argument(
@@ -1439,8 +1431,7 @@ def main():
     if cluster_config and cluster_config.jenkins:
         config["lineage_seed"] = random.randint(0, 2**31 - 1)
 
-    repo_dir = os.path.dirname(os.path.dirname(__file__))
-    local_outdir = os.path.join(repo_dir, "nextflow_temp", experiment_id)
+    local_outdir = os.path.join(REPO_DIR, "nextflow_temp", experiment_id)
     os.makedirs(local_outdir, exist_ok=True)
     if filesystem is None:
         if os.path.exists(exp_outdir) and not args.resume:
@@ -1478,7 +1469,7 @@ def main():
     if args.resume is None:
         copy_to_filesystem(temp_stripped_path, final_stripped_path, filesystem)
 
-    nf_config = os.path.join(os.path.dirname(__file__), "nextflow", "config.template")
+    nf_config = os.path.join(NEXTFLOW_DIR, "config.template")
     with open(nf_config, "r") as f:
         nf_config = f.readlines()
     nf_config = "".join(nf_config)
@@ -1572,9 +1563,7 @@ def main():
 
     run_parca, sim_imports, sim_workflow = generate_code(config)
 
-    nf_template_path = os.path.join(
-        os.path.dirname(__file__), "nextflow", "template.nf"
-    )
+    nf_template_path = os.path.join(NEXTFLOW_DIR, "template.nf")
     with open(nf_template_path, "r") as f:
         nf_template = f.readlines()
     nf_template = "".join(nf_template)

From f62a183ac61e51cd721d81ed8e216b99eac81190 Mon Sep 17 00:00:00 2001
From: ntfrgl <b.beronov@gmail.com>
Date: Sun, 17 May 2026 16:32:38 -0700
Subject: [PATCH 3/4] Fixes to Xarray/Zarr metadata emission

Fix Xarray attributes for child variables:
  - add `VariableSpec.attr_name` and use it as the attribute key in
    `VariableSpec.alloc_coord()`
  - always resend attributes in `XarrayBuffer.render()` to avoid
    erasure by `xarray.backends.writers.dump_to_store()`

Fix chunk spec for `generation > 1`:
  - separate logical time predicates
    `AsyncBufferWriter.is_1st_buf_in_{lineage,generation}`
  - add kwarg `VariableSpec.encoding(include_coo: bool)`

Extend integration test `test_xarray_emitter.TestEcoliSim`:
  - add `buffers_per_chunk` to test parameters
  - complete `.check_tree_shape()`
  - add `.check_chunks()`
  - add `.check_codecs()` with comparison key `.zarr_codec_key()`

Ancillary improvements:
  - separate methods `XarrayBuffer.{render,encodings}()`
  - explicitly specify default Zarr codecs in
    `AsyncZarrBufferWriter.coo_codecs()`
---
 ecoli/library/xarray_emitter/storage.py       |  45 ++-
 .../xarray_emitter/test_xarray_emitter.py     | 381 ++++++++++++++++--
 ecoli/library/xarray_emitter/transducer.py    | 152 ++++---
 ecoli/library/xarray_emitter/writer.py        |  61 ++-
 ecoli/library/xarray_emitter/zarr_writer.py   |  69 +++-
 runscripts/test_workflow.py                   |  16 +-
 6 files changed, 572 insertions(+), 152 deletions(-)

diff --git a/ecoli/library/xarray_emitter/storage.py b/ecoli/library/xarray_emitter/storage.py
index 387067d76..24517fd7d 100644
--- a/ecoli/library/xarray_emitter/storage.py
+++ b/ecoli/library/xarray_emitter/storage.py
@@ -208,6 +208,14 @@ def __post_init__(self) -> None:
 
     # ~~~~~~~~~~~~~~~~~ #
 
+    @property
+    def attr_name(self) -> str:
+        """
+        Attribute name used by :py:meth:`.alloc_coord`.
+        """
+        return (self.partition.time_var_name if self.is_time
+                else self.var_name)
+
     @staticmethod
     def var_coo_name(var_name: str, /) -> str:
         """
@@ -262,9 +270,9 @@ def zeros(self, buf_size: int, /) -> np.ndarray:
         return np.zeros(self.dims(buf_size), dtype=self.dtype)
 
     def encoding(
-        self, writer: AsyncBufferWriter, buf_size: int, /
+        self, writer: AsyncBufferWriter, buf_size: int, *, include_coo: bool
     ) -> dict[str, VariableEncoding]:
-        """
+        r"""
         Parameters used for writing a variable array and its coordinate array to
         persistent storage, including chunk sizes and compression codecs.
 
@@ -272,26 +280,31 @@ def encoding(
 
         Calls: :py:meth:`.AsyncBufferWriter.coo_codecs` and
         :py:meth:`.AsyncBufferWriter.var_codecs`.
+
+        Args:
+          writer:       Used for interpreting backend-specific codecs and for
+                        retrieving ``writer.config["buffers_per_chunk"]``.
+          buf_size:     :py:attr:`.XarrayTransducer.buf_size`.
+          include_coo:  Include :py:meth:`.AsyncBufferWriter.coo_codecs`.
         """
         b = writer.config["buffers_per_chunk"]
         # coordinate encoding
-        match (self.is_time, self.coord):
-            case (False, None):
-                coo_enc = {}
-            case (False, np.ndarray() as coo):
-                coo_enc = {self.coo_name: {
-                    # use 1 storage chunk for the coordinate array
-                    "chunks": coo.shape} | writer.coo_codecs(self)}
-            case (True, np.ndarray() as coo):
+        coo_enc: dict[str, VariableEncoding] = {}
+        match (include_coo, self.is_time, self.coord):
+            case (True, False, np.ndarray() as coo):
+                coo_enc |= {self.coo_name: writer.coo_codecs(self) | {
+                    # use 1 storage chunk for non-time coordinate
+                    "chunks": coo.shape}}
+            case (True, True, np.ndarray() as coo):
                 if writer.transducer.buf_shifts:
                     assert coo.shape == (buf_size,)
-                coo_enc = {self.coo_name: {
-                    # use 1 storage chunk for `b` buffers of the time coordinate
-                    "chunks": (b * buf_size,)} | writer.coo_codecs(self)}
+                coo_enc |= {self.coo_name: writer.coo_codecs(self) | {
+                    # use 1 storage chunk for `b` buffers of time coordinate
+                    "chunks": (b * buf_size,)}}
         # variable encoding
-        var_enc = {self.datavar_name: {
+        var_enc = {self.datavar_name: writer.var_codecs(self) | {
             # use 1 storage chunk for `b` buffers of simulation data
-            "chunks": self.dims(b * buf_size)} | writer.var_codecs(self)}
+            "chunks": self.dims(b * buf_size)}}
         return coo_enc | var_enc
 
     # ~~~~~~~~~~~~~~~~~ #
@@ -357,7 +370,7 @@ def alloc_coord(self) -> Dataset:
         """
         return Dataset(
             coords={} if self.coord is None else {self.coo_name: self.coord},
-            attrs={} if self.unit is None else {self.datavar_name: self.unit})
+            attrs={} if self.unit is None else {self.attr_name: self.unit})
 
     def alloc_var(self, buf_size: int, /) -> Dataset:
         """
diff --git a/ecoli/library/xarray_emitter/test_xarray_emitter.py b/ecoli/library/xarray_emitter/test_xarray_emitter.py
index 0bc9c9fd7..740ffa336 100644
--- a/ecoli/library/xarray_emitter/test_xarray_emitter.py
+++ b/ecoli/library/xarray_emitter/test_xarray_emitter.py
@@ -6,21 +6,25 @@
 
 from contextlib import ContextDecorator
 from dataclasses import dataclass, field
+from functools import partial
 from pathlib import Path
 from random import randint
-from typing import Any, Self, final, cast
+from typing import Any, Literal, Self, Callable, final, cast
 
 import numpy as np
 from pytest import MonkeyPatch, mark, param, raises
 from xarray import DataArray, DataTree, open_datatree
-from zarr import Group, open_consolidated
+from xarray.core.datatree import NodePath
+from zarr import Array, Group, open_consolidated
 
 from ecoli.library.test_utils import PatchConfig, filter_warnings
 from ecoli.library.xarray_emitter.emit_path import EmitPath, EmitPathType
-from ecoli.library.xarray_emitter.storage import XarrayStoragePartition
-# from ecoli.library.xarray_emitter.emitter import XarrayEmitter
+from ecoli.library.xarray_emitter.view import LeafView, ForestView
+from ecoli.library.xarray_emitter.storage import (
+    XarrayStoragePartition, VariableSpec, VariableEncoding)
 from ecoli.library.xarray_emitter.zarr_writer import (
     AsyncZarrBufferWriter, group_tree)
+from ecoli.library.xarray_emitter.emitter import XarrayEmitter
 from ecoli.library.xarray_emitter.utils import WarningFilter
 from ecoli.processes.metabolism import TIME_UNITS
 
@@ -87,10 +91,11 @@ class XarrayEmitterConfig(PatchConfig):
     """
 
     outdir: Path
-    zarr_format: int
+    zarr_format: Literal[2, 3]
     threaded: bool
     debug: bool
     interval: int
+    buffers_per_chunk: int
 
     def __post_init__(self) -> None:
         assert isinstance(self.outdir, Path)
@@ -103,6 +108,7 @@ def to_dict(self) -> dict[str, Any]:
                 "out_dir": str(self.outdir),
                 "writer": {
                     "threaded": self.threaded,
+                    "buffers_per_chunk": self.buffers_per_chunk,
                     "backend": "zarr",
                     "backend_config": {
                         "format": self.zarr_format
@@ -134,7 +140,7 @@ class StoreResult(ContextDecorator):
 
     store: Path
     partition: XarrayStoragePartition
-    zarr_format: int
+    zarr_format: Literal[2, 3]
     zarr: Group = field(init=False)
     xarray: DataTree = field(init=False)
 
@@ -165,25 +171,40 @@ def close(self) -> None:
 
 
 class TestEcoliSim:
+    """
+    Complete integration test for :py:class:`.XarrayEmitter`, running an
+    abridged multi-generation simulation workflow using
+    :py:class:`.MockEcoliSimWorkflow`, and validating the full round-tripped
+    data structure from the output Zarr store.
+    """
 
     @classmethod
     @filter_warnings(ecolisim_warnings)
     @filter_warnings(AsyncZarrBufferWriter.warnings_all())
     @mark.parametrize(
-        "num_generations, last_success, interval, zarr_format, threaded, debug",
-        [param(*args, **kwargs,
-               id="gen_{}-succ_{}-intvl_{}_zarr_{}-thrd_{}-dbg_{}".format(*args))
-         for (args, kwargs) in [
-            ((1, False, 1, 2, False, True ), {}),
-            ((2, True,  3, 2, True,  False), {}),
-            ((2, True,  2, 3, True,  True), {"marks": mark.basic_workflow}),
-            ((3, False, 1, 3, True,  False), {})
-         ]])
+        "num_generations, last_success, interval, "
+        "buffers_per_chunk, zarr_format, threaded, debug",
+        [
+            param(*args, **kwargs, id=(
+                "gen:{}_succ:{}_intvl:{}_buf:{}_zarr:{}_thrd:{}_dbg:{}"
+            ).format(*args))
+            for (args, kwargs) in [
+                ((1, False, 1, 1, 2, False, True ), {}),
+                ((2, True,  3, 2, 2, True,  False), {}),
+                ((2, True,  2, 1, 3, True,  True), {"marks": mark.basic_workflow}),
+                ((3, False, 1, 3, 3, True,  False), {})
+            ]
+        ]
+    )
     def test_workflow(
         cls, monkeypatch: MonkeyPatch, tmp_path: Path,
         num_generations: int, last_success: bool, interval: int,
-        zarr_format: int, threaded: bool, debug: bool
+        buffers_per_chunk: int, zarr_format: Literal[2, 3],
+        threaded: bool, debug: bool
     ):
+        """
+        Driver for the integration test.
+        """
         # set repository paths
         sim_data_path = Path.cwd() / "out" / "kb" / "simData.cPickle"
         config_name = "test_xarray_emitter"
@@ -203,7 +224,8 @@ def test_workflow(
             daughter_outdir=daughter_outdir,
             lineage_seed=randint(0, 2**10 - 1),
             emitter_config=XarrayEmitterConfig(
-                workdir, zarr_format, threaded, debug, interval))
+                workdir, zarr_format, threaded, debug,
+                interval, buffers_per_chunk))
 
         # step through workflow
         hline = "=" * 79
@@ -211,66 +233,116 @@ def test_workflow(
             print(f"\n{hline}\nGeneration: {g}\n{hline}")
             # execute simulation
             success = (g < num_generations) or last_success
-            partition = cast(XarrayStoragePartition, wf.sim_gen(success))
+            (partition, config) = wf.sim_gen(success)
+            assert isinstance(partition, XarrayStoragePartition)
             # read emitted data
+            view = ForestView.from_dict(config["emitter_arg"]["view"])
             with StoreResult(store, partition, zarr_format) as result:
                 # validate emitted data
-                cls.check_tree(result)
-                cls.check_encoding(result)
-                cls.check_log(result)
-                cls.check_success(result, success)
+                cls.check_tree_shape(result, view)
+                cls.check_log(result, success)
                 cls.check_time(result, interval)
+                cls.check_chunks(result, view, interval, buffers_per_chunk, config)
+                cls.check_codecs(result, view, zarr_format, config)
 
     # ~~~~~~~~~~~~~~~~~ #
 
-    @staticmethod
-    def check_tree(res: StoreResult) -> None:
+    @classmethod
+    def check_tree_shape(cls, res: StoreResult, view: ForestView) -> None:
         """
-        Check the basic integrity of the round-tripped
-        :py:class:`xarray.DataTree`.
+        Check the syntactic integrity of the round-tripped store data structure,
+        for *all generations emitted so far*.
+
+        Calls: :py:meth:`.check_root_node_shape` and
+        :py:meth:`.check_child_node_shape`.
         """
         # let Zarr traverse the store
+        z = res.zarr
         print()
-        print(group_tree(res.zarr))
+        print(group_tree(z))
 
         # let Xarray traverse the store
+        x = res.xarray
+        print("\n", "-" * 79, "\n")
+        print(x)
         print()
-        print(res.xarray)
 
         # inspect current and previous generations
         p: XarrayStoragePartition | None = res.partition
         while p is not None:
-            # look for expected fields in the root node
-            assert len(res.xarray.attrs[p.sim_id])
-            assert p.time_var_name in res.xarray.attrs
-            assert p.time_coo_name in res.xarray.coords
-            assert p.time_var_name in res.xarray.data_vars
+            # traverse the store tree
+            cls.check_root_node_shape(p, x)
+            t_size = len(x._data_variables[p.time_var_name])
+            for tree in view.forest:
+                for leaf in tree.leaves:
+                    cls.check_child_node_shape(p, t_size, leaf, x)
             p = p.parent if p.generation > 1 else None
 
     @staticmethod
-    def check_encoding(res: StoreResult) -> None:
-        pass
+    def check_root_node_shape(p: XarrayStoragePartition, n: DataTree) -> None:
+        """
+        Look for expected fields in the root node of the output store.
+
+        Called by: :py:meth:`.check_tree_shape`.
+        """
+        assert isinstance(n, DataTree)
+
+        # simulation metadata
+        assert set(n.attrs[p.sim_id].keys()) == set(XarrayEmitter.metadata_keys)
+
+        # unit annotation
+        assert p.time_var_name in n.attrs
+
+        # coordinate & data variables
+        ti = n._node_coord_variables[p.time_coo_name]
+        t = n._data_variables[p.time_var_name]
+        assert ti.shape == t.shape
 
     @staticmethod
-    def check_log(res: StoreResult) -> None:
+    def check_child_node_shape(
+        p: XarrayStoragePartition, t_size: int, leaf: LeafView, n: DataTree
+    ) -> None:
         """
-        Check the integrity of the write log.
+        Look for expected fields in a child node of the output store.
+
+        Called by: :py:meth:`.check_tree_shape`.
         """
-        assert {"sim_step", "sim_time"} == set(
-            res.xarray.attrs.get(res.partition.log_attr_name, {}).keys())
+        m = n[str(leaf.path)]
+        assert isinstance(m, DataTree)
+        v = leaf.var_name
+
+        # unit annotation
+        if leaf.unit:
+            assert isinstance(u := m.attrs[v], str) and u
+
+        # coordinate & data variables
+        assert (d := m.data_vars[p.dynamic_suffix]).shape[0] == t_size
+        if c := m._node_coord_variables:
+            assert set(c.keys()) == {o := VariableSpec.var_coo_name(v)}
+            assert d.shape[1:] == c[o].shape
+        else:
+            assert d.shape[1:] == ()
+
+    # ~~~~~~~~~~~~~~~~~ #
 
     @staticmethod
-    def check_success(res: StoreResult, success: bool) -> None:
+    def check_log(res: StoreResult, success: bool) -> None:
         """
-        Check the validity of the success flag.
+        Check the integrity of the write log and the validity of the success
+        flag for *the latest emitted generation*.
         """
+        assert {"sim_step", "sim_time"} == set(
+            res.xarray.attrs.get(res.partition.log_attr_name, {}).keys())
         assert success == res.xarray.attrs.get(
             res.partition.success_attr_name, False)
 
+    # ~~~~~~~~~~~~~~~~~ #
+
     @staticmethod
     def check_time(res: StoreResult, interval: int) -> None:
         """
-        Check the validity of the time variable.
+        Check the validity of the time variable for *the latest emitted
+        generation*.
         """
         # attribute names
         sim_id = res.partition.sim_id
@@ -307,3 +379,228 @@ def check_time(res: StoreResult, interval: int) -> None:
         assert t.values.min() == t_01[0]
         assert t.values.max() == t_end
         assert np.array_equiv(np.diff(t), idt)
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @classmethod
+    def check_chunks(
+        cls, res: StoreResult, view: ForestView,
+        interval: int, buffers_per_chunk: int, config: dict[str, Any]
+    ) -> None:
+        """
+        Check the integrity of all Zarr chunks for *the latest emitted
+        generation*.
+
+        Calls: :py:meth:`.check_root_node_chunks` and
+        :py:meth:`.check_child_node_chunks`.
+        """
+        # config variables
+        p = res.partition
+        T: float = config["max_duration"]
+        dt: float = config["time_step"]
+        cnf = config["emitter_arg"]["transducer"]["predicate"]
+        pred = {"subsample": {"interval": interval}}
+        assert any(pred in clause for clause in cnf)
+        b: int = config["emitter_arg"]["transducer"]["buffer"]["size"]
+        c: int = config["emitter_arg"]["writer"]["buffers_per_chunk"]
+        assert buffers_per_chunk == c
+
+        # store accessor
+        def z(path: str | NodePath) -> Array:
+            return cast(Array, res.zarr[str(path)])
+
+        # traverse the store tree
+        t_size = 1 + int(T / dt) // interval
+        c_size = b * c
+        cls.check_root_node_chunks(p, t_size, c_size, z)
+        for tree in view.forest:
+            for leaf in tree.leaves:
+                cls.check_child_node_chunks(p, t_size, c_size, leaf, z)
+
+    @staticmethod
+    def check_root_node_chunks(
+        p: XarrayStoragePartition, t_size: int, c_size: int,
+        g: Callable[[str | NodePath], Array]
+    ) -> None:
+        """
+        Check the integrity of the Zarr chunks in the root node of the output
+        store.
+
+        Called by: :py:meth:`.check_chunks`.
+        """
+        # data variable
+        t = g(p.time_var_name)
+        assert t.shape == (t_size,)
+        assert t.chunks == (c_size,)
+
+        # coordinate variable
+        ti = g(p.time_coo_name)
+        assert ti.shape == (t_size,)
+        assert ti.chunks == (c_size,)
+
+    @staticmethod
+    def check_child_node_chunks(
+        p: XarrayStoragePartition, t_size: int, c_size: int,
+        leaf: LeafView, g: Callable[[str | NodePath], Array]
+    ) -> None:
+        """
+        Check the integrity of the Zarr chunks in a child node of the output
+        store.
+
+        Called by: :py:meth:`.check_chunks`.
+        """
+        # data variable
+        d = g(leaf.path / p.dynamic_suffix)
+        assert d.shape[0] == t_size
+        assert d.chunks[0] == c_size
+
+        # coordinate variable
+        try:
+            c = g(leaf.path / VariableSpec.var_coo_name(leaf.var_name))
+            assert d.shape[1:] == c.shape
+            assert d.chunks[1:] == c.chunks
+            assert c.shape == c.chunks
+        except KeyError:
+            assert d.shape[1:] == ()
+            assert d.chunks[1:] == ()
+
+    # ~~~~~~~~~~~~~~~~~ #
+
+    @classmethod
+    def check_codecs(
+        cls, res: StoreResult, view: ForestView,
+        zarr_format: Literal[2, 3], config: dict[str, Any]
+    ) -> None:
+        """
+        Check the integrity of all Zarr codecs for *the latest emitted
+        generation*.
+
+        Calls: :py:meth:`.check_root_node_codecs` and
+        :py:meth:`.check_child_node_codecs`.
+        """
+        # config variables
+        p = res.partition
+        b: int = config["emitter_arg"]["transducer"]["buffer"]["size"]
+
+        # transport backend
+        writer = AsyncZarrBufferWriter(config["emitter_arg"]["writer"])
+
+        # store accessor
+        def z(path: str | NodePath) -> Array:
+            return cast(Array, res.zarr[str(path)])
+
+        # traverse the store tree
+        cls.check_root_node_codecs(p, writer, zarr_format, b, z)
+        for tree in view.forest:
+            for leaf in tree.leaves:
+                cls.check_child_node_codecs(p, writer, zarr_format, leaf, z)
+
+    @classmethod
+    def check_root_node_codecs(
+        cls, p: XarrayStoragePartition, writer: AsyncZarrBufferWriter,
+        zarr_format: Literal[2, 3], b: int,
+        g: Callable[[str | NodePath], Array]
+    ) -> None:
+        """
+        Check the integrity of the Zarr codecs in the root node of the output
+        store.
+
+        Called by: :py:meth:`.check_codecs`.
+
+        Calls: :py:meth:`.compare_zarr_codecs`.
+        """
+        time_spec = VariableSpec.make_time(p, b)
+        # coordinate variable
+        cls.compare_zarr_codecs(zarr_format,
+                                writer._coo_codecs(zarr_format, time_spec),
+                                g(p.time_coo_name))
+        # data variable
+        cls.compare_zarr_codecs(zarr_format,
+                                writer._var_codecs(zarr_format, time_spec),
+                                g(p.time_var_name))
+
+    @classmethod
+    def check_child_node_codecs(
+        cls, p: XarrayStoragePartition, writer: AsyncZarrBufferWriter,
+        zarr_format: Literal[2, 3], leaf: LeafView,
+        g: Callable[[str | NodePath], Array]
+    ) -> None:
+        """
+        Check the integrity of the Zarr codecs in a child node of the output
+        store.
+
+        Called by: :py:meth:`.check_codecs`.
+
+        Calls: :py:meth:`.compare_zarr_codecs`.
+        """
+        v = leaf.var_name
+        var_spec = VariableSpec(
+            # skip coord array construction for the purposes of this test
+            partition=p, coord=None,
+            var_name=v, dtype=leaf.dtype, unit=leaf.unit,
+            codecs=leaf.codecs)
+        # data variable
+        cls.compare_zarr_codecs(zarr_format,
+                                writer._var_codecs(zarr_format, var_spec),
+                                g(leaf.path / p.dynamic_suffix))
+        # coordinate variable (a `KeyError` is tolerated only for the lookup)
+        try:
+            coo = g(leaf.path / VariableSpec.var_coo_name(v))
+        except KeyError:
+            return
+        cls.compare_zarr_codecs(
+            zarr_format, writer._coo_codecs(zarr_format, var_spec), coo)
+
+    @classmethod
+    def compare_zarr_codecs(
+        cls, zarr_format: Literal[2, 3], spec: VariableEncoding, array: Array
+    ) -> None:
+        """
+        Compare the codec specified by a :py:class:`.VariableSpec` with the
+        codec retrieved from the corresponding store array metadata.
+
+        Called by: :py:meth:`.check_root_node_codecs` and
+        :py:meth:`.check_child_node_codecs`.
+
+        Calls: :py:meth:`.zarr_codec_key`.
+        """
+        assert isinstance(spec, dict)
+        assert isinstance(array, Array)
+        codec_key = partial(cls.zarr_codec_key, zarr_format)
+        for k in ("filters", "compressors"):
+            # skip `None` entries (an absent codec), which carry no config
+            spec_k = [c for c in (spec.get(k) or ()) if c is not None]
+            array_k = [c for c in getattr(array, k) if c is not None]
+            assert set(map(codec_key, spec_k)) == set(map(codec_key, array_k))
+
+    @staticmethod
+    def zarr_codec_key(zarr_format: Literal[2, 3], codec: Any) -> tuple:
+        """
+        Hashable partial Zarr codec specification, used as a comparison key.
+        This key avoids direct comparisons for those configuration options that
+        may be set adaptively by Zarr during the encoding process.
+
+        Called by: :py:meth:`.compare_zarr_codecs`.
+        """
+        z = zarr_format
+        if (d := codec.get_config() if z == 2 else codec.to_dict()):
+            c = d if z == 2 else d.get("configuration", {})
+            match (n := d["id"] if z == 2 else d["name"]):
+                case "zstd":
+                    return (n, c["level"])
+                case "delta" if z == 2:
+                    return (n, c["dtype"])
+                case "numcodecs.delta" if z == 3:
+                    return (n, c["dtype"])
+                case "lzma" if z == 2:
+                    return (n, c["format"],
+                            tuple(sorted(f["id"] for f in c["filters"])))
+                case "numcodecs.lzma" if z == 3:
+                    return (n, c["format"],
+                            tuple(sorted(f["id"] for f in c["filters"])))
+                case "blosc":
+                    return (n, c["cname"], c["clevel"])
+                case _:
+                    raise NotImplementedError(f"unsupported Zarr v{z} codec: {n!r}")
+        else:
+            return ()
diff --git a/ecoli/library/xarray_emitter/transducer.py b/ecoli/library/xarray_emitter/transducer.py
index 2523b55f3..1249fb6e2 100644
--- a/ecoli/library/xarray_emitter/transducer.py
+++ b/ecoli/library/xarray_emitter/transducer.py
@@ -117,9 +117,10 @@ def output_paths(self) -> dict[HierarchyPath, tuple[NodePath, str]]:
     def modified_paths(self) -> set[NodePath]:
         """
         Relative paths inside the independent substore that are modified during
-        a *daughter* generation. This information may be used by
-        :py:class:`.AsyncBufferWriter` backends for maintaining metadata
-        consistency.
+        a *daughter* generation.
+
+        Possibly called by: :py:meth:`.AsyncBufferWriter.merge_attributes` and
+        :py:meth:`.AsyncBufferWriter.consolidate`.
         """
         return {NodePath()}
 
@@ -127,15 +128,14 @@ def modified_paths(self) -> set[NodePath]:
     def added_paths(self) -> set[NodePath]:
         """
         Relative paths inside the independent substore that are added during a
-        *daughter* generation. This information may be used by
-        :py:class:`.AsyncBufferWriter` backends for maintaining metadata
-        consistency.
+        *daughter* generation.
+
+        Possibly called by: :py:meth:`.AsyncBufferWriter.consolidate`.
         """
         root_paths = set(map(NodePath, self.root._variables.keys()))
-        child_var_paths = set(
-            path / cast(str, var)
-            for (path, node) in self.child_vars.items()
-            for var in node._variables.keys())
+        child_var_paths = set(path / cast(str, var)
+                              for (path, node) in self.child_vars.items()
+                              for var in node._variables.keys())
         return child_var_paths | root_paths
 
     # ~~~~~~~~~~~~~~~~~ #
@@ -185,7 +185,7 @@ def alloc(self, buf_size: int, metadata: dict) -> None:
           buf_size: :py:attr:`.XarrayTransducer.buf_size`.
           metadata: Result of :py:meth:`.XarrayEmitter.extract_metadata`.
         """
-        assert not(self.child_coords)
+        assert not(self.child_vars)
         self.time_spec = VariableSpec.make_time(self.partition, buf_size)
         self.root = self.time_spec.alloc_time(buf_size).assign_attrs(
             VariableSpec.alloc_metadata(self.partition, metadata)._attrs)
@@ -193,6 +193,32 @@ def alloc(self, buf_size: int, metadata: dict) -> None:
             self.child_coords[path] = var.alloc_coord()
             self.child_vars[path] = var.alloc_var(buf_size)
 
+    def encodings(
+        self, writer: AsyncBufferWriter, buf_size: int, *, include_coo: bool
+    ) -> dict[str, VariableEncoding]:
+        r"""
+        Determine encoding parameters for all variables.
+
+        Called by: :py:meth:`.XarrayTransducer.flush`.
+
+        Calls: :py:meth:`.VariableSpec.encoding`.
+
+        Args:
+          writer:       Used for choosing backend-specific
+                        :py:type:`.VariableEncoding`\ s.
+          buf_size:     :py:attr:`.XarrayTransducer.buf_size`.
+          include_coo:  Include :py:type:`.VariableEncoding`\ s for
+                        :py:attr:`.child_coords`.
+        """
+        assert self.child_vars
+        enc: dict[str, VariableEncoding] = {}
+        enc[""] = self.time_spec.encoding(writer, buf_size, include_coo=True)
+        for (path, var) in self.var_specs.items():
+            enc[str(path)] = var.encoding(writer, buf_size, include_coo=include_coo)
+        return enc
+
+    # ~~~~~~~~~~~~~~~~~ #
+
     def write(
         self, buf_tix: int, sim_tix: int, t: float, data: dict[str, Any], /
     ) -> None:
@@ -247,25 +273,17 @@ def write(
         if len(emit_queue) and sim_tix > 0:
             raise KeyError(f"Missing emit paths: {list(emit_queue)}")
 
-    def render(
-        self, writer: AsyncBufferWriter | None, buf_size: int,
-        *, include_static: bool, copy: bool
-    ) -> tuple[xarray.DataTree, dict[str, VariableEncoding]]:
+    def render(self, *, include_coo: bool, copy: bool) -> xarray.DataTree:
         r"""
         Assemble the output buffer components.
 
         Called by: :py:meth:`.XarrayTransducer.flush`.
 
-        Calls: :py:meth:`.VariableSpec.encoding` and
-        :py:meth:`xarray.DataTree.from_dict`.
+        Calls: :py:meth:`xarray.DataTree.from_dict`.
 
         Args:
-          writer:         Used for choosing backend-specific
-                          :py:type:`.VariableEncoding`\ s.
-          buf_size:       :py:attr:`.XarrayTransducer.buf_size`.
-          include_static: Include :py:attr:`.child_coords`
-                          and all :py:type:`.VariableEncoding`\ s.
-          copy:           Return a deep copy of arrays.
+          include_coo:  Include :py:attr:`.child_coords`.
+          copy:         Return a deep copy of arrays.
 
         .. note::
           The deep copy performed here is a conservative choice, which allows
@@ -295,17 +313,12 @@ def render(
 
         # fetch child nodes
         assert set(self.child_coords) == set(self.child_vars)
-        match (include_static, copy):
-            case (False, False):
-                children = self.child_vars
-            case (False, True):
-                children = {
-                    p: n._copy(deep=True)
-                    for (p, n) in self.child_vars.items()}
+        match (include_coo, copy):
             case (True, False):
                 children = {
-                    # `self.child_vars[p]` holds only `data_vars` by construction
-                    p: c.assign(self.child_vars[p]._variables)
+                    p: c.assign(
+                        # holds only `data_vars` by construction
+                        self.child_vars[p]._variables)
                     for (p, c) in self.child_coords.items()}
             case (True, True):
                 children = {
@@ -313,22 +326,29 @@ def render(
                         k: v._copy(deep=True)
                         for (k, v) in self.child_vars[p]._variables.items()})
                     for (p, c) in self.child_coords.items()}
+            case (False, False):
+                children = {
+                    p: n.assign_attrs(
+                        # always resend attributes, in order to avoid erasure by
+                        # `xarray.backends.writers.dump_to_store()` (xarray==2026.04)
+                        **self.child_coords[p].attrs)
+                    for (p, n) in self.child_vars.items()}
+            case (False, True):
+                children = {
+                    p: n._copy(deep=True).assign_attrs(
+                        **self.child_coords[p].attrs)
+                    for (p, n) in self.child_vars.items()}
 
-        # assemble nodes
+        # assemble output tree
         buf = DataTree.from_dict(cast(dict[str, Dataset], root | children))
 
         # check consistency between composition logic and update logic
         assert set(str(NodePath("/") / p.parent)
                    for p in (self.added_paths | self.modified_paths)
                    ).issubset(buf.groups)
+        return buf
 
-        # fetch encodings
-        enc: dict[str, VariableEncoding] = {}
-        if include_static and writer is not None:
-            enc |= {"": self.time_spec.encoding(writer, buf_size)}
-            enc |= {str(path): var.encoding(writer, buf_size)
-                    for (path, var) in self.var_specs.items()}
-        return (buf, enc)
+    # ~~~~~~~~~~~~~~~~~ #
 
     def get_time(self, buf_tix: int) -> float:
         """
@@ -466,8 +486,7 @@ def validate_config(cls, config: dict[str, Any], /) -> None:
                     f"\"buffer\": {{\"size\": {buf_size}}}"))
 
     def __str__(self) -> str:
-        return self.display(self.buffer.render(
-            None, self.buf_size, include_static=True, copy=False)[0])
+        return self.display(self.buffer.render(include_coo=True, copy=False))
 
     def display(self, buf: DataTree, /) -> str:
         return (
@@ -507,6 +526,8 @@ def alloc(
         self.buffer.alloc(self.buf_size, metadata)
         self.check_buffer()
 
+    # ~~~~~~~~~~~~~~~~~ #
+
     def step(self, data: dict[str, Any], /) -> bool:
         r"""
         If :py:attr:`.predicate` is satisfied for the current *simulation step*
@@ -542,7 +563,7 @@ def step(self, data: dict[str, Any], /) -> bool:
         return True
 
     def flush(
-        self, writer: AsyncBufferWriter, *, include_static: bool, final: bool
+        self, writer: AsyncBufferWriter, *, final: bool
     ) -> tuple[xarray.DataTree, dict[str, VariableEncoding], dict[str, Any]]:
         r"""
         Assemble the output buffer that will be sent to persistent storage, and
@@ -550,36 +571,53 @@ def flush(
 
         Called by: :py:meth:`.AsyncBufferWriter.write`.
 
-        Calls: :py:meth:`.XarrayBuffer.render` and
+        Calls: :py:attr:`.AsyncBufferWriter.is_1st_buf_in_lineage`,
+        :py:attr:`.AsyncBufferWriter.is_1st_buf_in_generation`,
+        :py:meth:`.XarrayBuffer.render`, :py:meth:`.XarrayBuffer.encodings` and
         :py:meth:`.AsyncBufferWriter.merge_attributes`.
 
         Args:
-          writer:         Used for choosing backend-specific
-                          :py:type:`.VariableEncoding`\ s and for combining
-                          metadata.
-          include_static: Include :py:attr:`.XarrayBuffer.child_coords`
-                          and all :py:type:`.VariableEncoding`\ s.
-          final:          Indicate the final buffer.
+          writer: Used for deciding when to emit coordinate data, for choosing
+                  backend-specific :py:type:`.VariableEncoding`\ s, and for
+                  calling the hook :py:meth:`.AsyncBufferWriter.merge_attributes`.
+          final:  Indicates the final buffer in a generation, which does not
+                  require deep copying.
 
         Returns:
-          - A deep copy of the in-memory buffer.
-          - Backend-specific variable encodings, only if ``include_static``.
+          - The in-memory buffer (deep-copied unless ``final``), including
+            :py:attr:`.XarrayBuffer.child_coords` only for the first buffer in a
+            lineage.
+          - Backend-specific :py:type:`.VariableEncoding`\ s, computed only for
+            the first buffer in a generation.
           - A JSON-serializable reference to the latest emitted simulation step.
         """
+        # prelude
         self.check_buffer()
         if final:
-            assert not (self.buf_shifts and include_static)
             if self.buf_tix < self.buf_size:
                 # at least one unfilled emit step inside allocated buffer
                 self.truncate()
         else:
             assert self.buf_tix == self.buf_size
-        (buf, enc) = self.buffer.render(
-            writer, self.buf_size,
-            include_static=include_static, copy=not final)
+
+        # fetch buffer data
+        include_coo = writer.is_1st_buf_in_lineage
+        buf = self.buffer.render(include_coo=include_coo, copy=not final)
+
+        # fetch buffer encodings
+        include_enc = writer.is_1st_buf_in_generation
+        assert not (include_enc and self.buf_shifts)
+        enc = (
+            self.buffer.encodings(writer, self.buf_size, include_coo=include_coo)
+            if include_enc
+            else {})
+
+        # attach session metadata
         writer.merge_attributes(buf)
         ref = {"sim_step": self.emitted_sim_tix,
                "sim_time": self.buffer.get_time(self.buf_tix - 1)}
+
+        # postlude
         if final:
             # reference to buffer components no longer needed
             self.clear()
@@ -588,6 +626,8 @@ def flush(
             print(hline, "\n", self.display(buf), "\n", hline)
         return (buf, enc, ref)
 
+    # ~~~~~~~~~~~~~~~~~ #
+
     def shift(self) -> None:
         """
         Shift the time coordinate by the buffer size, without modifying the
diff --git a/ecoli/library/xarray_emitter/writer.py b/ecoli/library/xarray_emitter/writer.py
index a5cb8f52a..8456ec6ed 100644
--- a/ecoli/library/xarray_emitter/writer.py
+++ b/ecoli/library/xarray_emitter/writer.py
@@ -199,7 +199,7 @@ def __init__(self, config: dict[str, Any], /) -> None:
         """ Synchronisation primitive for :py:attr:`.executor`. """
         self.future.set_result(None)
         self.num_writes: int = 0
-        """ Count of submitted buffer writes. """
+        """ Count of buffers submitted to :py:attr:`.executor`. """
 
     @classmethod
     def validate_config(cls, config: dict[str, Any], /) -> None:
@@ -322,7 +322,7 @@ def close(self) -> None:
         Terminate the :py:attr:`.executor` thread, call :py:meth:`.consolidate`,
         and close the :py:attr:`.store`.
         """
-        if self.num_writes > 0:
+        if not self.is_1st_buf_in_generation:
             self.sync(shutdown=True)
         self.executor.shutdown(wait=True)
         self.consolidate()
@@ -391,14 +391,16 @@ def warnings_all(cls) -> list[WarningFilter]:
     def merge_attributes(self, payload: DataTree) -> None:
         """
         :py:meth:`.XarrayBuffer.render` is designed to only output chunk-level
-        changes to Xarray variables and attributes. While variables are always
-        either introduced or appended, some transport layer backends may
-        *overwrite* attribute containers instead of *updating* them, which would
-        invalidate attributes at :py:attr:`.XarrayBuffer.modified_paths`. This
-        method allows such conflicts to be resolved in-place, before the payload
-        is passed to :py:meth:`.make_effect`.
+        *updates* to Xarray variables and attributes. However, while coordinate
+        and data variables are always either introduced or appended, attribute
+        containers may be *overwritten* instead of *updated* by some transport
+        layer backends, which would invalidate them. This hook allows such
+        conflicts to be resolved in memory, before the corrected payload is
+        passed to :py:meth:`.make_effect`.
 
         Called by: :py:meth:`.XarrayTransducer.flush`.
+
+        Possibly calls: :py:attr:`.XarrayBuffer.modified_paths`.
         """
         ...
 
@@ -478,6 +480,35 @@ def consolidate(self) -> None:
 
     # ~~~~~~~~~~~~~~~~~ #
 
+    @property
+    def is_1st_buf_in_lineage(self) -> bool:
+        """
+        Logical *global* time predicate for :py:class:`.AsyncBufferWriter`,
+        indicating that the currently active :py:class:`.XarrayBuffer` cycle --
+        i.e., the one that will be sent to :py:attr:`.executor` next -- is the
+        first in a *cell lineage* simulation.
+
+        Calls: :py:attr:`.is_1st_buf_in_generation`.
+
+        Called by: :py:meth:`.XarrayTransducer.flush`.
+        """
+        return self.partition.generation == 1 and self.is_1st_buf_in_generation
+
+    @property
+    def is_1st_buf_in_generation(self) -> bool:
+        """
+        Logical *local* time predicate for :py:class:`.AsyncBufferWriter`,
+        indicating that the currently active :py:class:`.XarrayBuffer` cycle --
+        i.e., the one that will be sent to :py:attr:`.executor` next -- is the
+        first in a *cell generation* simulation.
+
+        Called by: :py:attr:`.is_1st_buf_in_lineage`, :py:meth:`.write`,
+        :py:meth:`.XarrayTransducer.flush` and :py:meth:`.close`.
+        """
+        return self.num_writes == 0
+
+    # ~~~~~~~~~~~~~~~~~ #
+
     def write(self, transducer: XarrayTransducer, *, final: bool) -> None:
         """
         Concurrently write a buffer to the open store, synchronising only at the
@@ -487,18 +518,12 @@ def write(self, transducer: XarrayTransducer, *, final: bool) -> None:
         :py:meth:`._write`.
 
         Args:
-          final: Indicates the final buffer, which does not require copying.
+          final: Indicates the final buffer in a *cell generation* simulation,
+                 which does not require deep copying.
         """
         assert self.num_writes >= 0
-        msg = transducer.flush(
-            # choose backend-specific encodings
-            self,
-            # emit coordinate data and encodings only with first trajectory buffer
-            include_static=(
-                self.partition.generation == 1 and self.num_writes == 0),
-            # final trajectory buffer does not require copying
-            final=final)
-        if self.num_writes > 0:
+        msg = transducer.flush(self, final=final)
+        if not self.is_1st_buf_in_generation:
             # finish writing previous buffer and update transport cache
             self.sync()
         self.future = self.executor.submit(self._write, *msg)
diff --git a/ecoli/library/xarray_emitter/zarr_writer.py b/ecoli/library/xarray_emitter/zarr_writer.py
index e39f43f29..b1fb33434 100644
--- a/ecoli/library/xarray_emitter/zarr_writer.py
+++ b/ecoli/library/xarray_emitter/zarr_writer.py
@@ -14,7 +14,7 @@
 from collections import deque
 from dataclasses import replace
 from html import escape as html_escape
-from typing import Any, Mapping, final, cast
+from typing import Any, Literal, Mapping, final, cast
 import sys
 import warnings
 
@@ -27,9 +27,12 @@
 from zarr.abc.codec import Codec
 from zarr.abc.numcodec import Numcodec
 from zarr.core.metadata import v2, v3
+from zarr.core.dtype import parse_dtype
 from zarr.core._tree import TreeRepr
 from zarr.types import AnyAsyncArray
-from zarr.core.array import Array, AsyncArray
+from zarr.core.array import (
+    Array, AsyncArray,
+    _parse_chunk_encoding_v2, default_filters_v3, default_compressors_v3)
 from zarr.core.sync import sync
 from zarr.core.group import (
     Group, AsyncGroup, GroupMetadata, ConsolidatedMetadata, _getitem_semaphore)
@@ -54,7 +57,10 @@
     2: [{"id": "delta", "dtype": None}],
     3: [{"name": "numcodecs.delta", "configuration": {"dtype": None}}]
 }
-""" Default filter codecs, as a function of the Zarr format. """
+"""
+Default filter codecs for :py:meth:`.AsyncZarrBufferWriter.var_codecs`, as a
+function of the Zarr format.
+"""
 ZARR_COMPRESSORS: dict[int, list[dict[str, Any]]] = {
     2: [{"id": "blosc", "cname": "zstd", "clevel": 6,
          "shuffle": -1, "blocksize": 0}],
@@ -62,7 +68,10 @@
         "cname": "zstd", "clevel": 6,
         "typesize": None, "shuffle": None, "blocksize": 0}}]
 }
-""" Default compression codecs, as a function of the Zarr format. """
+"""
+Default compression codecs for :py:meth:`.AsyncZarrBufferWriter.var_codecs`, as
+a function of the Zarr format.
+"""
 
 
 # ==============================================================================
@@ -649,23 +658,48 @@ def _open_store(self) -> ZarrStore:
 
     def coo_codecs(self, var: VariableSpec, /) -> VariableEncoding:
         """
-        Currently, no Zarr codecs are applied to coordinate arrays.
+        Currently, only Zarr's own default codecs are applied to a coordinate
+        array.
         """
-        return {}
+        return self._coo_codecs(self.group.metadata.zarr_format, var)
 
     def var_codecs(self, var: VariableSpec, /) -> VariableEncoding:
         """
-        Parse the Zarr codecs for a simulation variable, if they are specified
-        in the JSON config, and otherwise, apply the default codecs.
+        Parse the Zarr codecs for a data array, if they are specified in the
+        JSON config, and otherwise, apply :py:const:`ZARR_FILTERS` and
+        :py:const:`ZARR_COMPRESSORS`.
         """
-        z: int = self.group.metadata.zarr_format
+        return self._var_codecs(self.group.metadata.zarr_format, var)
+
+    @classmethod
+    def _coo_codecs(
+        cls, zarr_format: Literal[2, 3], var: VariableSpec, /
+    ) -> VariableEncoding:
+        dtype = parse_dtype(var.dtype, zarr_format=zarr_format)
+        # parse default config
+        filters: tuple[Codec | Numcodec, ...] | None
+        compressors: tuple[Codec | Numcodec | None, ...]
+        if zarr_format == 2:
+            filters, compressor = _parse_chunk_encoding_v2(
+                filters="auto", compressor="auto", dtype=dtype)
+            compressors = (compressor,)
+        else:
+            filters = default_filters_v3(dtype)
+            compressors = default_compressors_v3(dtype)
+        return {"filters": filters, "compressors": compressors}
+
+    @classmethod
+    def _var_codecs(
+        cls, zarr_format: Literal[2, 3], var: VariableSpec, /
+    ) -> VariableEncoding:
+        z = zarr_format
         if var.codecs:
             # fetch variable-specific JSON config
             _filters = var.codecs.get(f"filters_v{z}", [])
             _compressors = var.codecs.get(f"compressors_v{z}", [])
             if not (_filters or _compressors):
                 raise ValueError(emitter_arg_error(
-                    self, "Missing arguments",
+                    cls, "Missing arguments",
                     f"...: {{\"codecs\": "
                     f"{{\"filters_v{z}\": ..., \"compressors_v{z}\": ...}}}}"))
         else:
@@ -680,7 +714,7 @@ def var_codecs(self, var: VariableSpec, /) -> VariableEncoding:
         # parse codec config
         filters: tuple[Codec | Numcodec, ...] | None
         compressors: tuple[Codec | Numcodec | None, ...]
-        with filter_warnings(self._warnings_make_effect):
+        with filter_warnings(cls.warnings_make_effect()):
             if z == 2:
                 filters = v2.parse_filters(_filters)
                 compressors = tuple(map(v2.parse_compressor, _compressors))
@@ -739,12 +773,13 @@ def merge_attributes(self, payload: DataTree) -> None:
         """
         Combine attributes from the existing Zarr store and the Xarray buffer
         update at :py:attr:`.XarrayBuffer.modified_paths`.
+
+        Calls: :py:attr:`.XarrayBuffer.modified_paths`.
         """
         for path in self.buffer.modified_paths:
             # empty in-memory attribute containers do not produce write operations
-            if (xr_attrs := payload._get_item(path).attrs):
-                zr_attrs = dict(self.get_zarr_path(path).attrs)
-                payload._get_item(path).attrs = zr_attrs | xr_attrs
+            if (node := payload._get_item(path)).attrs:
+                node.attrs = dict(self.get_zarr_path(path).attrs) | node.attrs
 
     def make_effect(
         self, payload: DataTree, encoding: Mapping[str, Any], /
@@ -765,7 +800,7 @@ def update_transport(self) -> None:
         generation-specific time axis.
         """
         assert self.group.metadata.consolidated_metadata is None
-        assert self.num_writes > 0
+        assert not self.is_1st_buf_in_generation
         if self.num_writes == 1:
             with filter_warnings(self._warnings_eval_effect):
                 # find direct children in the Zarr hierarchy
@@ -780,7 +815,9 @@ def consolidate(self) -> None:
         Update existing consolidated metadata in the Zarr store with the outputs
         of a newly finished simulation.
 
-        Calls: :py:func:`zarr.consolidate_metadata` or
+        Calls: Either :py:func:`zarr.consolidate_metadata`, or
+        :py:attr:`.XarrayBuffer.modified_paths`,
+        :py:attr:`.XarrayBuffer.added_paths` and
         :py:func:`.reconsolidate_metadata`.
         """
         assert self.group.metadata.consolidated_metadata is None
diff --git a/runscripts/test_workflow.py b/runscripts/test_workflow.py
index e54676fa5..88927d099 100644
--- a/runscripts/test_workflow.py
+++ b/runscripts/test_workflow.py
@@ -22,6 +22,7 @@
 import sys
 from dataclasses import dataclass, field
 from pathlib import Path
+from typing import Any
 from unittest.mock import patch
 
 import pytest
@@ -153,6 +154,8 @@ class MockEcoliSimWorkflow:
     #: - Passed to :py:class:`.EcoliSim` via the CLI arguments
     #:   ``--emitter`` and ``--emitter_arg``.
     emitter_config: PatchConfig
+    #: Result of combining :py:attr:`.config_file` and :py:attr:`.emitter_config`.
+    config: dict[str, Any] = field(init=False)
 
     # ~~~~~~~~~~~~~~~~~ #
 
@@ -228,9 +231,10 @@ def init_sim(self, success: bool, /) -> EcoliSim:
 
         # configure the emitter parameters
         config.update_from_dict(self.emitter_config.to_dict())
+        self.config = config.to_dict()
 
         # construct the simulation state
-        sim = EcoliSim(config.to_dict())
+        sim = EcoliSim(self.config)
         with patch_func("ecoli.composites.ecoli_master.get_state_from_file") as f:
             sim.build_ecoli()
             if self.generation == 1:
@@ -269,7 +273,7 @@ def _check_complete(_: Engine):
 
     # ~~~~~~~~~~~~~~~~~ #
 
-    def sim_gen(self, success: bool, /) -> StoragePartition:
+    def sim_gen(self, success: bool, /) -> tuple[StoragePartition, dict[str, Any]]:
         """
         Emulate ``runscripts/nextflow/sim.nf::{simGen0,sim}()`` by starting a
         single-generation simulation, stopping at ``config["max_duration"]``,
@@ -279,7 +283,11 @@ def sim_gen(self, success: bool, /) -> StoragePartition:
         Calls: :py:meth:`.init_sim`.
 
         Args:
-            success: Flag for emulating a :py:exc:`.DivisionDetected` event.
+          success: Flag for emulating a :py:exc:`.DivisionDetected` event.
+
+        Returns:
+          - :py:class:`.StoragePartition` of the resulting simulation.
+          - Full configuration of the resulting simulation.
         """
         # sanity check the mock generation state
         assert self.sim is None
@@ -308,7 +316,7 @@ def sim_gen(self, success: bool, /) -> StoragePartition:
         self.agent_id += "0"
         self.generation += 1
         self.sim_seed += 1
-        return partition
+        return (partition, self.config)
 
 
 # ==============================================================================

From 5649bfbe42b3f7c10ff9f8368453c1d834ac65eb Mon Sep 17 00:00:00 2001
From: ntfrgl <b.beronov@gmail.com>
Date: Sun, 17 May 2026 17:50:47 -0700
Subject: [PATCH 4/4] Update dependency: `zarr==3.2`

---
 doc/conf.py                                 | 1 +
 ecoli/library/xarray_emitter/zarr_writer.py | 6 +++---
 pyproject.toml                              | 6 +++---
 uv.lock                                     | 8 ++++----
 4 files changed, 11 insertions(+), 10 deletions(-)

diff --git a/doc/conf.py b/doc/conf.py
index 06ffe1a0e..142d7857f 100644
--- a/doc/conf.py
+++ b/doc/conf.py
@@ -100,6 +100,7 @@
     # Sphinx does not recognize type aliases
     ("py:type", "VariableEncoding"),
     ("py:class", "VariableEncoding"),
+    ("py:class", "AnyAsyncArray"),
 ]
 
 
diff --git a/ecoli/library/xarray_emitter/zarr_writer.py b/ecoli/library/xarray_emitter/zarr_writer.py
index b1fb33434..e93faf8c8 100644
--- a/ecoli/library/xarray_emitter/zarr_writer.py
+++ b/ecoli/library/xarray_emitter/zarr_writer.py
@@ -163,7 +163,7 @@ async def consolidate_metadata(
         k: v.metadata
         async for (k, v) in
         group.members(max_depth=None, use_consolidated_for_children=False)}
-    # TODO: fix in `consolidate_metadata()` (zarr==3.1.6)
+    # TODO: fix in `consolidate_metadata()` (zarr==3.2.1)
     members_metadata |= {"": group.metadata}
 
     # combine and write consolidated metadata
@@ -232,7 +232,7 @@ async def reconsolidate_metadata(
                     v, ConsolidatedMetadata(metadata={}))
     members_metadata |= mod_members_metadata | add_members_metadata
     del old_keys, mod_members_metadata, add_members_metadata
-    # TODO: fix in `ConsolidatedMetadata._flat_to_nested()` (zarr==3.1.6)
+    # TODO: fix in `ConsolidatedMetadata._flat_to_nested()` (zarr==3.2.1)
     members_metadata = dict(sorted(members_metadata.items(),
                                    key=lambda kv: bfs_key(kv[0])))
     ConsolidatedMetadata._flat_to_nested(members_metadata)
@@ -359,7 +359,7 @@ async def group_tree_async(
     # Group members by parent key so we can render the tree level by level.
     nodes: dict[str, list[tuple[str, Any]]] = {}
     for key, node in members:
-        # TODO: fix in `group_tree_async()` (zarr==3.1.6)
+        # TODO: fix in `group_tree_async()` (zarr==3.2.1)
         if key == "":
             # avoid self-loop at root node
             continue
diff --git a/pyproject.toml b/pyproject.toml
index 81559e902..b5c03aafa 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -36,9 +36,9 @@ dependencies = [
     "polars",
     "xarray>=2026.04",
     # concurrency control in `ecoli.library.xarray_emitter.zarr_writer`
-    # might require adjustments for `zarr>=3.2`:
-    # https://ossci.zulipchat.com/#narrow/channel/423692-Zarr/topic/3.2E2.2E0.20release
-    "zarr~=3.1.6",
+    # might require adjustments for `zarr>=3.3`:
+    # https://github.com/zarr-developers/zarr-python/pull/3547
+    "zarr==3.2.*",
     "zarrs>=0.2",
     # future consumers of `xarray_emitter`
     # "cubed>=0.26",
diff --git a/uv.lock b/uv.lock
index dcd0434a9..327521f89 100644
--- a/uv.lock
+++ b/uv.lock
@@ -3967,7 +3967,7 @@ requires-dist = [
     { name = "vl-convert-python" },
     { name = "xarray", specifier = ">=2026.4" },
     { name = "xmltodict" },
-    { name = "zarr", specifier = "~=3.1.6" },
+    { name = "zarr", specifier = "==3.2.*" },
     { name = "zarrs", specifier = ">=0.2" },
 ]
 provides-extras = ["dev", "docs"]
@@ -4170,7 +4170,7 @@ wheels = [
 
 [[package]]
 name = "zarr"
-version = "3.1.6"
+version = "3.2.1"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "donfig" },
@@ -4180,9 +4180,9 @@ dependencies = [
     { name = "packaging" },
     { name = "typing-extensions" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/31/5a/b8a0cf39a14c770c30bd1f2d120c54000c8cd9e84e8e79f38d9a7ce58071/zarr-3.1.6.tar.gz", hash = "sha256:d95e72cbea4b90e9a70679468b8266400331756232576ae2b43400ac5108d0eb", size = 386531, upload-time = "2026-03-23T17:25:18.748Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/93/8d/aeb164004f87543b06ef54f885d02c342c31ceb274e2bbec470a98927621/zarr-3.2.1.tar.gz", hash = "sha256:71565b738a0e7e8ed226f0516eba8c6bb53440ad7669a8c48ebb3534a161d035", size = 675161, upload-time = "2026-05-05T12:37:22.383Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/de/7c/ba8ca8cbe9dbef8e83a95fc208fed8e6686c98b4719aaa0aa7f3d31fe390/zarr-3.1.6-py3-none-any.whl", hash = "sha256:b5a82c5079d1c3d4ee8f06746fa3b9a98a7d804300fa3f4be154362a33e1207e", size = 295655, upload-time = "2026-03-23T17:25:17.189Z" },
+    { url = "https://files.pythonhosted.org/packages/88/0a/469e2bd01be1490336e6c8707386845655d59261543315778a3ccc7e8019/zarr-3.2.1-py3-none-any.whl", hash = "sha256:f78cdd3d9687ad0e9f9cba2c5683b64f0c52589c19f685eeabe872e93cc0d2c7", size = 319617, upload-time = "2026-05-05T12:37:20.66Z" },
 ]
 
 [[package]]