diff --git a/src/hdmf_zarr/backend.py b/src/hdmf_zarr/backend.py index 3dda6aa0..b3338f38 100644 --- a/src/hdmf_zarr/backend.py +++ b/src/hdmf_zarr/backend.py @@ -157,10 +157,22 @@ def object_codec_class(self): def open(self): """Open the Zarr file""" if self.__file is None: - self.__file = zarr.open(store=self.path, - mode=self.__mode, - synchronizer=self.__synchronizer, - storage_options=self.__storage_options) + if self.__mode == 'w': + self.__file = zarr.open(store=self.path, + mode=self.__mode, + synchronizer=self.__synchronizer, + storage_options=self.__storage_options) + else: + self.__file = self.__open_file_consolidated(store=self.path, + mode=self.__mode, + synchronizer=self.__synchronizer, + storage_options=self.__storage_options) + def close(self): """Close the Zarr file""" @@ -427,9 +439,10 @@ def write_builder(self, **kwargs): (f_builder.__class__.__qualname__, f_builder.name, self.source)) # Consolidate metadata for the entire file after everything has been written - zarr.consolidate_metadata(self.path, metadata_key='.zmetadata') + zarr.consolidate_metadata(store=self.path) - def consolidate_metadata(self): + def consolidate_metadata(self, store): """ When a file is written, the metadata within the file is consolidated automatically. If there are any metadata changes, the user needs to consolidate the metadata again @@ -438,22 +451,31 @@ def consolidate_metadata(self): Consolidate all metadata for groups and arrays within the given store into a single resource and put it under .zmetadata. """ - zarr.consolidate_metadata(self.path, metadata_key='.zmetadata') + zarr.consolidate_metadata(store, metadata_key='.zmetadata') - def open_file_consolidated(self): + def __open_file_consolidated(self, + store, + mode, + synchronizer=None, + storage_options=None): """ This method will check to see if the metadata has been consolidated, if so """ - if os.path.isfile(self.path+'/.zmetadata'): - zarr.open_consolidated(store=self.path, - mode=self.__mode,) + # self.path may be a supported Zarr store object rather than a string path, so fall back to its .path + try: + temp = os.path.isfile(self.path+'/.zmetadata') + except TypeError: + temp = os.path.isfile(self.path.path+'/.zmetadata') + if temp: + return zarr.open_consolidated(store=store, + mode=mode, + synchronizer=synchronizer, + storage_options=storage_options) + else: + msg = "Could not find consolidated metadata." + warnings.warn(msg) - - zarr.open(store=self.path, - mode=self.__mode, - synchronizer=self.__synchronizer) + return zarr.open(store=store, + mode=mode, + synchronizer=synchronizer, + storage_options=storage_options) @docval({'name': 'parent', 'type': Group, 'doc': 'the parent Zarr object'}, {'name': 'builder', 'type': GroupBuilder, 'doc': 'the GroupBuilder to write'}, @@ -604,7 +626,11 @@ def get_zarr_paths(zarr_object): # In Zarr the path is a combination of the path of the store and the path of the object.
So we first need to # merge those two paths, then remove the path of the file, add the missing leading "/" and then compute the # directory name to get the path of the parent - fullpath = os.path.normpath(os.path.join(zarr_object.store.path, zarr_object.path)).replace("\\", "/") + if isinstance(zarr_object.store, zarr.storage.ConsolidatedMetadataStore): + fpath = zarr_object.store.store.path + else: + fpath = zarr_object.store.path + fullpath = os.path.normpath(os.path.join(fpath, zarr_object.path)).replace("\\", "/") # To determine the filepath we now iterate over the path and check if the .zgroup object exists at # a level, indicating that we are still within the Zarr file. The first level we hit where the parent # directory does not have a .zgroup means we have found the main file @@ -915,7 +941,11 @@ def write_dataset(self, **kwargs): # noqa: C901 if isinstance(data, Array): # copy the dataset if link_data: - self.__add_link__(parent, data.store.path, data.name, name) + if isinstance(data.store, zarr.storage.ConsolidatedMetadataStore): + path = data.store.store.path + else: + path = data.store.path + self.__add_link__(parent, path, data.name, name) linked = True dset = None else: @@ -1231,7 +1261,11 @@ def read_builder(self): return f_builder def __set_built(self, zarr_obj, builder): - fpath = zarr_obj.store.path + if isinstance(zarr_obj.store, zarr.storage.ConsolidatedMetadataStore): + fpath = zarr_obj.store.store.path + else: + fpath = zarr_obj.store.path path = zarr_obj.path path = os.path.join(fpath, path) self.__built.setdefault(path, builder) @@ -1271,12 +1305,19 @@ def __get_built(self, zarr_obj): :type zarr_obj: Zarr Group or Dataset :return: Builder in the self.__built cache or None """ - fpath = zarr_obj.store.path + if isinstance(zarr_obj.store, zarr.storage.ConsolidatedMetadataStore): + fpath = zarr_obj.store.store.path + else: + fpath = zarr_obj.store.path path = zarr_obj.path path = os.path.join(fpath, path) return self.__built.get(path, None) def __read_group(self, zarr_obj, name=None): ret = self.__get_built(zarr_obj) if ret is not None: return ret diff --git a/src/hdmf_zarr/backend2.py b/src/hdmf_zarr/backend2.py new file mode 100644 index 00000000..505031ea --- /dev/null +++ b/src/hdmf_zarr/backend2.py @@ -0,0 +1,1420 @@ +"""Module with the Zarr-based I/O-backend for HDMF""" +# Python imports +import os +import warnings +import numpy as np +import tempfile +import logging + +# Zarr imports +import zarr +from zarr.hierarchy import Group +from zarr.core import Array +from zarr.storage import (DirectoryStore, + TempStore, + NestedDirectoryStore) +import numcodecs + +# HDMF-ZARR imports +from .utils import (ZarrDataIO, + ZarrReference, + ZarrSpecWriter, + ZarrSpecReader, + ZarrIODataChunkIteratorQueue) +from .zarr_utils import BuilderZarrReferenceDataset, BuilderZarrTableDataset + +# HDMF imports +from hdmf.backends.io import HDMFIO +from hdmf.backends.errors import UnsupportedOperation +from hdmf.backends.utils import (NamespaceToBuilderHelper, + WriteStatusTracker) +from hdmf.utils import (docval, + getargs, + popargs, + get_docval, + get_data_shape) +from hdmf.build import (Builder, + GroupBuilder, + DatasetBuilder, + LinkBuilder, + BuildManager, + RegionBuilder, + ReferenceBuilder, + TypeMap) +from hdmf.data_utils import AbstractDataChunkIterator +from hdmf.spec import (RefSpec, + DtypeSpec, + NamespaceCatalog) +from hdmf.query import HDMFDataset +from hdmf.container import Container
+ +# Module variables +ROOT_NAME = 'root' +""" +Name of the root builder for read/write +""" + +SPEC_LOC_ATTR = '.specloc' +""" +Reserved attribute storing the path to the Group where the schema for the file are cached +""" + +DEFAULT_SPEC_LOC_DIR = 'specifications' +""" +Default name of the group where specifications should be cached +""" + +SUPPORTED_ZARR_STORES = (DirectoryStore, + TempStore, + NestedDirectoryStore) +""" +Tuple listing all Zarr storage backends supported by ZarrIO +""" + + +class ZarrIO(HDMFIO): + + @staticmethod + def can_read(path): + try: + # TODO: how to use storage_options? Maybe easier to just check for ".zarr" suffix + zarr.open(path, mode="r") + return True + except Exception: + return False + + @docval({'name': 'path', + 'type': (str, *SUPPORTED_ZARR_STORES), + 'doc': 'the path to the Zarr file or a supported Zarr store'}, + {'name': 'manager', 'type': BuildManager, 'doc': 'the BuildManager to use for I/O', 'default': None}, + {'name': 'mode', 'type': str, + 'doc': 'the mode to open the Zarr file with, one of ("w", "r", "r+", "a", "w-")'}, + {'name': 'synchronizer', 'type': (zarr.ProcessSynchronizer, zarr.ThreadSynchronizer, bool), + 'doc': 'Zarr synchronizer to use for parallel I/O. If set to True a ProcessSynchronizer is used.', + 'default': None}, + {'name': 'object_codec_class', 'type': None, + 'doc': 'Set the numcodec object codec class to be used to encode objects. ' + 'Use numcodecs.pickles.Pickle by default.', + 'default': None}, + {'name': 'storage_options', 'type': dict, + 'doc': 'Zarr storage options to read remote folders', + 'default': None}) + def __init__(self, **kwargs): + self.logger = logging.getLogger('%s.%s' % (self.__class__.__module__, self.__class__.__qualname__)) + path, manager, mode, synchronizer, object_codec_class, storage_options = popargs( + 'path', 'manager', 'mode', 'synchronizer', 'object_codec_class', 'storage_options', kwargs) + if manager is None: + manager = BuildManager(TypeMap(NamespaceCatalog())) + if isinstance(synchronizer, bool): + if synchronizer: + sync_path = tempfile.mkdtemp() + self.__synchronizer = zarr.ProcessSynchronizer(sync_path) + else: + self.__synchronizer = None + else: + self.__synchronizer = synchronizer + self.__mode = mode + self.__path = path + self.__file = None + self.__storage_options = storage_options + self.__built = dict() + self._written_builders = WriteStatusTracker() # track which builders were written (or read) by this IO object + self.__dci_queue = None # Will be initialized on call to io.write + # Codec class to be used. Alternates, e.g., =numcodecs.JSON + self.__codec_cls = numcodecs.pickles.Pickle if object_codec_class is None else object_codec_class + source_path = self.__path + if isinstance(self.__path, SUPPORTED_ZARR_STORES): + source_path = self.__path.path + super().__init__(manager, source=source_path) + + @property + def file(self): + """ + The Zarr zarr.hierarchy.Group (or zarr.core.Array) opened by the backend. + May be None in case open has not been called yet, e.g., if no data has been + read or written yet via this instance.
+ """ + return self.__file + + @property + def path(self): + """The path to the Zarr file as set by the user""" + return self.__path + + @property + def abspath(self): + """The absolute path to the Zarr file""" + return os.path.abspath(self.source) + + @property + def synchronizer(self): + return self.__synchronizer + + @property + def object_codec_class(self): + return self.__codec_cls + + def open(self): + """Open the Zarr file""" + if self.__file is None: + self.__file = self.__open_file_consolidated(store=self.path, + mode=self.__mode, + synchronizer=self.__synchronizer, + storage_options=self.__storage_options) + + def close(self): + """Close the Zarr file""" + self.__file = None + return + + def is_remote(self): + """Return True if the file is remote, False otherwise""" + from zarr.storage import FSStore + if isinstance(self.file.store, FSStore): + return True + else: + return False + + @classmethod + @docval({'name': 'namespace_catalog', + 'type': (NamespaceCatalog, TypeMap), + 'doc': 'the NamespaceCatalog or TypeMap to load namespaces into'}, + {'name': 'path', + 'type': (str, *SUPPORTED_ZARR_STORES), + 'doc': 'the path to the Zarr file or a supported Zarr store'}, + {'name': 'namespaces', 'type': list, 'doc': 'the namespaces to load', 'default': None}) + def load_namespaces(cls, namespace_catalog, path, namespaces=None): + ''' + Load cached namespaces from a file. + ''' + # TODO: how to use storage_options here? + # f = self.__open_file_consolidated(source=path, mode='r') + f = zarr.open(path, mode='r') + if SPEC_LOC_ATTR not in f.attrs: + msg = "No cached namespaces found in %s" % path + warnings.warn(msg) + else: + spec_group = f[f.attrs[SPEC_LOC_ATTR]] + if namespaces is None: + namespaces = list(spec_group.keys()) + for ns in namespaces: + ns_group = spec_group[ns] + latest_version = list(ns_group.keys())[-1] + ns_group = ns_group[latest_version] + reader = ZarrSpecReader(ns_group) + namespace_catalog.load_namespaces('namespace', reader=reader) + + @docval( + {'name': 'container', 'type': Container, 'doc': 'the Container object to write'}, + {'name': 'cache_spec', 'type': bool, 'doc': 'cache specification to file', 'default': True}, + {'name': 'link_data', 'type': bool, + 'doc': 'If not specified otherwise link (True) or copy (False) Datasets', 'default': True}, + {'name': 'exhaust_dci', 'type': bool, + 'doc': 'exhaust DataChunkIterators one at a time. If False, add ' + + 'them to the internal queue self.__dci_queue and exhaust them concurrently at the end', + 'default': True}, + { + "name": "number_of_jobs", + "type": int, + "doc": ( + "Number of jobs to use in parallel during write " + "(only works with GenericDataChunkIterator-wrapped datasets)." + ), + "default": 1, + }, + { + "name": "max_threads_per_process", + "type": int, + "doc": ( + "Limits the number of threads used by each process. The default is None (no limits)." + ), + "default": None, + }, + { + "name": "multiprocessing_context", + "type": str, + "doc": ( + "Context for multiprocessing. It can be None (default), 'fork' or 'spawn'. " + "Note that 'fork' is only available on UNIX systems (not Windows)." 
+ ), + "default": None, + }, + ) + def write(self, **kwargs): + """Overwrite the write method to add support for caching the specification and parallelization.""" + cache_spec, number_of_jobs, max_threads_per_process, multiprocessing_context = popargs( + "cache_spec", "number_of_jobs", "max_threads_per_process", "multiprocessing_context", kwargs + ) + + self.__dci_queue = ZarrIODataChunkIteratorQueue( + number_of_jobs=number_of_jobs, + max_threads_per_process=max_threads_per_process, + multiprocessing_context=multiprocessing_context, + ) + + super(ZarrIO, self).write(**kwargs) + if cache_spec: + self.__cache_spec() + + def __cache_spec(self): + """Interanl function used to cache the spec in the current file""" + ref = self.__file.attrs.get(SPEC_LOC_ATTR) + spec_group = None + if ref is not None: + spec_group = self.__file[ref] + else: + path = DEFAULT_SPEC_LOC_DIR # do something to figure out where the specifications should go + spec_group = self.__file.require_group(path) + self.__file.attrs[SPEC_LOC_ATTR] = path + ns_catalog = self.manager.namespace_catalog + for ns_name in ns_catalog.namespaces: + ns_builder = NamespaceToBuilderHelper.convert_namespace(ns_catalog, ns_name) + namespace = ns_catalog.get_namespace(ns_name) + if namespace.version is None: + group_name = '%s/unversioned' % ns_name + else: + group_name = '%s/%s' % (ns_name, namespace.version) + ns_group = spec_group.require_group(group_name) + writer = ZarrSpecWriter(ns_group) + ns_builder.export('namespace', writer=writer) + + @docval( + *get_docval(HDMFIO.export), + {'name': 'cache_spec', 'type': bool, 'doc': 'whether to cache the specification to file', 'default': True}, + { + "name": "number_of_jobs", + "type": int, + "doc": ( + "Number of jobs to use in parallel during write " + "(only works with GenericDataChunkIterator-wrapped datasets)." + ), + "default": 1, + }, + { + "name": "max_threads_per_process", + "type": int, + "doc": ( + "Limits the number of threads used by each process. The default is None (no limits)." + ), + "default": None, + }, + { + "name": "multiprocessing_context", + "type": str, + "doc": ( + "Context for multiprocessing. It can be None (default), 'fork' or 'spawn'. " + "Note that 'fork' is only available on UNIX systems (not Windows)." + ), + "default": None, + }, + ) + def export(self, **kwargs): + """Export data read from a file from any backend to Zarr. + See :py:meth:`hdmf.backends.io.HDMFIO.export` for more details. + """ + if self.__mode != 'w': + raise UnsupportedOperation("Cannot export to file %s in mode '%s'. Please use mode 'w'." + % (self.source, self.__mode)) + + src_io = getargs('src_io', kwargs) + write_args, cache_spec = popargs('write_args', 'cache_spec', kwargs) + number_of_jobs, max_threads_per_process, multiprocessing_context = popargs( + "number_of_jobs", "max_threads_per_process", "multiprocessing_context", kwargs + ) + + self.__dci_queue = ZarrIODataChunkIteratorQueue( + number_of_jobs=number_of_jobs, + max_threads_per_process=max_threads_per_process, + multiprocessing_context=multiprocessing_context, + ) + + if not isinstance(src_io, ZarrIO) and write_args.get('link_data', True): + raise UnsupportedOperation("Cannot export from non-Zarr backend %s to Zarr with write argument " + "link_data=True." 
% src_io.__class__.__name__) + + write_args['export_source'] = src_io.source # pass export_source=src_io.source to write_builder + ckwargs = kwargs.copy() + ckwargs['write_args'] = write_args + super().export(**ckwargs) + if cache_spec: + self.__cache_spec() + + def get_written(self, builder, check_on_disk=False): + """ + Return True if this builder has been written to (or read from) disk by this IO object, False otherwise. + + :param builder: Builder object to get the written flag for + :type builder: Builder + :param check_on_disk: Check that the builder has been physically written to disk not just flagged as written + by this I/O backend + :type check_on_disk: bool + :return: True if the builder is found in self._written_builders using the builder ID, False otherwise. If + check_on_disk is enabled then the function calls get_builder_exists_on_disk in addition to verify + that the builder has indeed been written to disk. + """ + written = self._written_builders.get_written(builder) + if written and check_on_disk: + written = written and self.get_builder_exists_on_disk(builder=builder) + return written + + @docval({'name': 'builder', 'type': Builder, 'doc': 'The builder of interest'}) + def get_builder_exists_on_disk(self, **kwargs): + """ + Convenience function to check whether a given builder exists on disk in this Zarr file. + """ + builder = getargs('builder', kwargs) + builder_path = self.get_builder_disk_path(builder=builder, filepath=None) + exists_on_disk = os.path.exists(builder_path) + return exists_on_disk + + @docval({'name': 'builder', 'type': Builder, 'doc': 'The builder of interest'}, + {'name': 'filepath', 'type': str, + 'doc': 'The path to the Zarr file or None for this file', 'default': None}) + def get_builder_disk_path(self, **kwargs): + builder, filepath = getargs('builder', 'filepath', kwargs) + basepath = filepath if filepath is not None else self.source + builder_path = os.path.join(basepath, self.__get_path(builder).lstrip("/")) + return builder_path + + @docval( + {'name': 'builder', 'type': GroupBuilder, 'doc': 'the GroupBuilder object representing the NWBFile'}, + { + 'name': 'link_data', + 'type': bool, + 'doc': 'If not specified otherwise link (True) or copy (False) Zarr Datasets', + 'default': True + }, + { + 'name': 'exhaust_dci', + 'type': bool, + 'doc': ( + 'Exhaust DataChunkIterators one at a time.
If False, add ' + 'them to the internal queue self.__dci_queue and exhaust them concurrently at the end' + ), + 'default': True, + }, + { + 'name': 'export_source', + 'type': str, + 'doc': 'The source of the builders when exporting', + 'default': None, + }, + ) + def write_builder(self, **kwargs): + """Write a builder to disk.""" + f_builder, link_data, exhaust_dci, export_source = getargs( + 'builder', 'link_data', 'exhaust_dci', 'export_source', kwargs + ) + for name, gbldr in f_builder.groups.items(): + self.write_group( + parent=self.__file, + builder=gbldr, + link_data=link_data, + exhaust_dci=exhaust_dci, + export_source=export_source, + ) + for name, dbldr in f_builder.datasets.items(): + self.write_dataset( + parent=self.__file, + builder=dbldr, + link_data=link_data, + exhaust_dci=exhaust_dci, + export_source=export_source, + ) + self.write_attributes(self.__file, f_builder.attributes) # the same as set_attributes in HDMF + self.__dci_queue.exhaust_queue() # Write any remaining DataChunkIterators that have been queued + self._written_builders.set_written(f_builder) + self.logger.debug("Done writing %s '%s' to path '%s'" % + (f_builder.__class__.__qualname__, f_builder.name, self.source)) + + # Consolidate metadata for the entire file after everything has been written + zarr.consolidate_metadata(self.__path, metadata_key='.zmetadata') + + def consolidate_metadata(self): + """ + When a file is written, the metadata within the file is consolidated automatically. + If there are any metadata changes, the user needs to consolidate the metadata again + with this method in order for the metadata to be read correctly. + + Consolidate all metadata for groups and arrays within the given store into a + single resource and put it under .zmetadata. + """ + zarr.consolidate_metadata(self.__path, metadata_key='.zmetadata') + + def __open_file_consolidated(self, + store, + mode, + synchronizer=None, + storage_options=None): + """ + Check whether the metadata for this file has been consolidated and, if so, open the + store with zarr.open_consolidated; otherwise warn and fall back to a regular zarr.open. + """ + + if os.path.isfile(self.__path+'/.zmetadata'): + return zarr.open_consolidated(store=store, + mode=mode, + synchronizer=synchronizer, + storage_options=storage_options) + else: + msg = "Could not find consolidated metadata." + warnings.warn(msg) + + return zarr.open(store=store, + mode=mode, + synchronizer=synchronizer, + storage_options=storage_options) + + @docval({'name': 'parent', 'type': Group, 'doc': 'the parent Zarr object'}, + {'name': 'builder', 'type': GroupBuilder, 'doc': 'the GroupBuilder to write'}, + {'name': 'link_data', 'type': bool, + 'doc': 'If not specified otherwise link (True) or copy (False) Zarr Datasets', 'default': True}, + {'name': 'exhaust_dci', 'type': bool, + 'doc': 'exhaust DataChunkIterators one at a time.
If False, add ' + 'them to the internal queue self.__dci_queue and exhaust them concurrently at the end', + 'default': True}, + {'name': 'export_source', 'type': str, + 'doc': 'The source of the builders when exporting', 'default': None}, + returns='the Group that was created', rtype='Group') + def write_group(self, **kwargs): + """Write a GroupBuilder to file""" + parent, builder, link_data, exhaust_dci, export_source = getargs( + 'parent', 'builder', 'link_data', 'exhaust_dci', 'export_source', kwargs + ) + + if self.get_written(builder): + group = parent[builder.name] + else: + group = parent.require_group(builder.name) + + subgroups = builder.groups + if subgroups: + for subgroup_name, sub_builder in subgroups.items(): + self.write_group( + parent=group, + builder=sub_builder, + link_data=link_data, + exhaust_dci=exhaust_dci, + ) + + datasets = builder.datasets + if datasets: + for dset_name, sub_builder in datasets.items(): + self.write_dataset( + parent=group, + builder=sub_builder, + link_data=link_data, + exhaust_dci=exhaust_dci, + export_source=export_source, + ) + + # write all links + links = builder.links + if links: + for link_name, sub_builder in links.items(): + self.write_link(group, sub_builder) + + attributes = builder.attributes + self.write_attributes(group, attributes) + self._written_builders.set_written(builder) # record that the builder has been written + return group + + @docval({'name': 'obj', 'type': (Group, Array), 'doc': 'the Zarr object to add attributes to'}, + {'name': 'attributes', + 'type': dict, + 'doc': 'a dict containing the attributes on the Group or Dataset, indexed by attribute name'}, + {'name': 'export_source', 'type': str, + 'doc': 'The source of the builders when exporting', 'default': None}) + def write_attributes(self, **kwargs): + """Set (i.e., write) the attributes on a given Zarr Group or Array.""" + obj, attributes, export_source = getargs('obj', 'attributes', 'export_source', kwargs) + + for key, value in attributes.items(): + # Case 1: list, set, tuple type attributes + if isinstance(value, (set, list, tuple)) or (isinstance(value, np.ndarray) and np.ndim(value) != 0): + # Convert to tuple for writing (e.g., numpy arrays are not JSON serializable) + if isinstance(value, np.ndarray): + tmp = tuple(value.tolist()) + else: + tmp = tuple(value) + # Attempt write of the attribute + try: + obj.attrs[key] = tmp + # Numpy scalars and bytes are not JSON serializable.
Try to convert to a serializable type instead + except TypeError as e: + try: + tmp = tuple([i.item() + if (isinstance(i, np.generic) and not isinstance(i, np.bytes_)) + else i.decode("utf-8") + if isinstance(i, (bytes, np.bytes_)) + else i + for i in value]) + obj.attrs[key] = tmp + except: # noqa: E722 + raise TypeError(str(e) + " type=" + str(type(value)) + " data=" + str(value)) from e + # Case 2: References + elif isinstance(value, (Container, Builder, ReferenceBuilder)): + # TODO: Region References are not yet supported + # if isinstance(value, RegionBuilder): + # type_str = 'region' + # refs = self.__get_ref(value.builder) + if isinstance(value, (ReferenceBuilder, Container, Builder)): + type_str = 'object' + if isinstance(value, Builder): + refs = self.__get_ref(value, export_source) + else: + refs = self.__get_ref(value.builder, export_source) + tmp = {'zarr_dtype': type_str, 'value': refs} + obj.attrs[key] = tmp + # Case 3: Scalar attributes + else: + # Attempt to write the attribute + try: + obj.attrs[key] = value + # Numpy scalars and bytes are not JSON serializable. Try to convert to a serializable type instead + except TypeError as e: + try: + val = value.item if isinstance(value, np.ndarray) else value + val = value.item() \ + if (isinstance(value, np.generic) and not isinstance(value, np.bytes_)) \ + else val.decode("utf-8") \ + if isinstance(value, (bytes, np.bytes_)) \ + else val + obj.attrs[key] = val + except: # noqa: E722 + msg = str(e) + "key=" + key + " type=" + str(type(value)) + " data=" + str(value) + raise TypeError(msg) from e + + def __get_path(self, builder): + """Get the path to the builder. + If builder.location is set then it is used as the path, otherwise the function + determines the path by constructing it iteratively from the parents of the + builder. + """ + if builder.location is not None: + path = os.path.normpath(os.path.join(builder.location, builder.name)).replace("\\", "/") + else: + curr = builder + names = list() + while curr is not None and curr.name != ROOT_NAME: + names.append(curr.name) + curr = curr.parent + delim = "/" + path = "%s%s" % (delim, delim.join(reversed(names))) + return path + + @staticmethod + def get_zarr_paths(zarr_object): + """ + For a Zarr object find 1) the path to the main zarr file it is in and 2) the path to the object within the file + :param zarr_object: Object for which we are looking up the path + :type zarr_object: Zarr Group or Array + :return: Tuple of two string with: 1) path of the Zarr file and 2) full path within the zarr file to the object + """ + # In Zarr the path is a combination of the path of the store and the path of the object. So we first need to + # merge those two paths, then remove the path of the file, add the missing leading "/" and then compute the + # directory name to get the path of the parent + fullpath = os.path.normpath(os.path.join(zarr_object.store.path, zarr_object.path)).replace("\\", "/") + # To determine the filepath we now iterate over the path and check if the .zgroup object exists at + # a level, indicating that we are still within the Zarr file. 
The first level we hit where the parent + # directory does not have a .zgroup means we have found the main file + filepath = fullpath + while os.path.exists(os.path.join(os.path.dirname(filepath), ".zgroup")): + filepath = os.path.dirname(filepath) + # From the fullpath and filepath we can now compute the objectpath within the zarr file as the relative + # path from the filepath to the object + objectpath = "/" + os.path.relpath(fullpath, filepath) + # return the result + return filepath, objectpath + + @staticmethod + def get_zarr_parent_path(zarr_object): + """ + Get the location of the parent of a zarr_object within the file + :param zarr_object: Object for which we are looking up the path + :type zarr_object: Zarr Group or Array + :return: String with the path + """ + filepath, objectpath = ZarrIO.get_zarr_paths(zarr_object) + parentpath = os.path.dirname(objectpath) + return parentpath + + @staticmethod + def is_zarr_file(path): + """ + Check if the given path defines a Zarr file + :param path: Full path to main directory + :return: Bool + """ + if os.path.exists(path): + if os.path.isdir(path): + if os.path.exists(os.path.join(path, ".zgroup")): + return True + return False + + def __is_ref(self, dtype): + if isinstance(dtype, DtypeSpec): + return self.__is_ref(dtype.dtype) + elif isinstance(dtype, RefSpec): + return True + elif isinstance(dtype, np.dtype): + return False + else: + return dtype == DatasetBuilder.OBJECT_REF_TYPE or dtype == DatasetBuilder.REGION_REF_TYPE + + def resolve_ref(self, zarr_ref): + """ + Get the full path to the object linked to by the zarr reference + + The function only constructs the links to the targe object, but it does not check if the object exists + + :param zarr_ref: Dict with `source` and `path` keys or a `ZarrReference` object + :return: 1) name of the target object + 2) the target zarr object within the target file + """ + # Extract the path as defined in the zarr_ref object + if zarr_ref.get('source', None) is None: + source_file = str(zarr_ref['path']) + else: + source_file = str(zarr_ref['source']) + # Resolve the path relative to the current file + if not self.is_remote(): + source_file = os.path.abspath(os.path.join(self.source, source_file)) + else: + # get rid of extra "/" and "./" in the path root and source_file + root_path = str(self.path).rstrip("/") + source_path = str(source_file).lstrip(".") + source_file = root_path + source_path + + object_path = zarr_ref.get('path', None) + if object_path: + target_name = os.path.basename(object_path) + else: + target_name = ROOT_NAME + + target_zarr_obj = zarr.open(source_file, mode='r', storage_options=self.__storage_options) + # target_zarr_obj = self.__open_file_consolidated(store=source_file, mode='r', storage_options=self.__storage_options) + if object_path is not None: + try: + target_zarr_obj = target_zarr_obj[object_path] + except Exception: + raise ValueError("Found bad link to object %s in file %s" % (object_path, source_file)) + # Return the create path + return target_name, target_zarr_obj + + def __get_ref(self, ref_object, export_source=None): + """ + Create a ZarrReference object that points to the given container + + :param ref_object: the object to be referenced + :type ref_object: Builder, Container, ReferenceBuilder + :returns: ZarrReference object + """ + if isinstance(ref_object, RegionBuilder): # or region is not None: TODO: Add to support regions + raise NotImplementedError("Region references are currently not supported by ZarrIO") + if isinstance(ref_object, Builder): + 
if isinstance(ref_object, LinkBuilder): + builder = ref_object.target_builder + else: + builder = ref_object + elif isinstance(ref_object, ReferenceBuilder): + builder = ref_object.builder + else: + builder = self.manager.build(ref_object) + path = self.__get_path(builder) + # TODO Add to get region for region references. + # Also add {'name': 'region', 'type': (slice, list, tuple), + # 'doc': 'the region reference indexing object', 'default': None}, + # if isinstance(ref_object, RegionBuilder): + # region = ref_object.region + + # get the object id if available + object_id = builder.get('object_id', None) + + # determine the object_id of the source by following the parents of the builder until we find the root + # the root builder should be the same as the source file containing the reference + curr = builder + while curr is not None and curr.name != ROOT_NAME: + curr = curr.parent + if curr: + source_object_id = curr.get('object_id', None) + # We did not find ROOT_NAME as a parent. This should only happen if we have an invalid + # file as a source, e.g., if during testing we use an arbitrary builder. We check this + # anyways to avoid potential errors just in case + else: + source_object_id = None + warn_msg = "Could not determine source_object_id for builder with path: %s" % path + warnings.warn(warn_msg) + + # by checking os.isdir makes sure we have a valid link path to a dir for Zarr. For conversion + # between backends a user should always use export which takes care of creating a clean set of builders. + source = (builder.source + if (builder.source is not None and os.path.isdir(builder.source)) + else self.source) + + # Make the source relative to the current file + # TODO: This check assumes that all links are internal links on export. + # Need to deal with external links on export. + if export_source is not None: + # Make sure the source of the reference is now towards the new file + # and not the original source when exporting. + source = '.' 
+ else: + source = os.path.relpath(os.path.abspath(source), start=self.abspath) + # Return the ZarrReference object + ref = ZarrReference( + source=source, + path=path, + object_id=object_id, + source_object_id=source_object_id) + return ref + + def __add_link__(self, parent, target_source, target_path, link_name): + """ + Add a link to the file + :param parent: The parent Zarr group containing the link + :type parent: zarr.hierarchy.Group + :param target_source: Source path within the Zarr file to the linked object + :type target_source: str + :param target_path: Path to the Zarr file containing the linked object + :param link_name: Name of the link + :type link_name: str + """ + if 'zarr_link' not in parent.attrs: + parent.attrs['zarr_link'] = [] + zarr_link = list(parent.attrs['zarr_link']) + zarr_link.append({'source': target_source, 'path': target_path, 'name': link_name}) + parent.attrs['zarr_link'] = zarr_link + + @docval({'name': 'parent', 'type': Group, 'doc': 'the parent Zarr object'}, + {'name': 'builder', 'type': LinkBuilder, 'doc': 'the LinkBuilder to write'}) + def write_link(self, **kwargs): + parent, builder = getargs('parent', 'builder', kwargs) + if self.get_written(builder): + self.logger.debug("Skipping LinkBuilder '%s' already written to parent group '%s'" + % (builder.name, parent.name)) + return + self.logger.debug("Writing LinkBuilder '%s' to parent group '%s'" % (builder.name, parent.name)) + name = builder.name + target_builder = builder.builder + # Get the reference + zarr_ref = self.__get_ref(target_builder) + # EXPORT WITH LINKS: Fix link source + # if the target and source are both the same, then we need to ALWAYS use ourselves as a source + # When exporting from one source to another, the LinkBuilders.source are not updated, i.e,. the + # builder.source and target_builder.source are not being updated and point to the old file, but + # for internal links (a.k.a, SoftLinks) they will be the same and our target will be part of + # our new file, so we can safely replace the source + if builder.source == target_builder.source: + zarr_ref.source = "." # Link should be relative to self + # EXPORT WITH LINKS: Make sure target is written. If is not then if the target points to a + # non-Zarr source, then we need to copy the data instead of writing a + # link to the data + # When exporting from a different backend, then we may encounter external links to + # other datasets, groups (or links) in another file. Since they are from another + # backend, we must ensure that those targets are copied as well, so we check here + # if our target_builder has been written and write it if it doesn't + # TODO: Review the logic for when we need to copy data and when to link it. We may need the export_source? 
+ """ + skip_link = False + if not self.get_written(target_builder): + if not self.is_zarr_file(target_builder.source): + # We need to copy the target in place of the link so we need to + # change the name of target_builder to match the link instead + temp = copy(target_builder.name) + target_builder._Builder__name = name + # Skip writing the link since we copied the data into place + skip_link = True + if isinstance(target_builder, DatasetBuilder): + self.write_dataset(parent=parent, builder=target_builder) + elif isinstance(target_builder, GroupBuilder): + self.write_group(parent=parent, builder=target_builder) + elif isinstance(target_builder, LinkBuilder): + self.write_link(parent=parent, builder=target_builder) + target_builder._Builder__name = temp + # REGULAR LINK I/O: + # Write the actual link as we should in most cases. Skip it only if we copied the + # data from an external source in place instead + if not skip_link: + self.__add_link__(parent, zarr_ref.source, zarr_ref.path, name) + """ + self.__add_link__(parent, zarr_ref.source, zarr_ref.path, name) + self._written_builders.set_written(builder) # record that the builder has been written + + @classmethod + def __setup_chunked_dataset__(cls, parent, name, data, options=None): + """ + Setup a dataset for writing to one-chunk-at-a-time based on the given DataChunkIterator. This + is a helper function for write_dataset() + :param parent: The parent object to which the dataset should be added + :type parent: Zarr Group or File + :param name: The name of the dataset + :type name: str + :param data: The data to be written. + :type data: AbstractDataChunkIterator + :param options: Dict with options for creating a dataset. available options are 'dtype' and 'io_settings' + :type options: dict + """ + io_settings = {} + if options is not None: + if 'io_settings' in options: + io_settings = options.get('io_settings') + # Define the chunking options if the user has not set them explicitly. We need chunking for the iterative write. + if 'chunks' not in io_settings: + recommended_chunks = data.recommended_chunk_shape() + io_settings['chunks'] = True if recommended_chunks is None else recommended_chunks + # Define the shape of the data if not provided by the user + if 'shape' not in io_settings: + io_settings['shape'] = data.recommended_data_shape() + if 'dtype' not in io_settings: + if (options is not None) and ('dtype' in options): + io_settings['dtype'] = options['dtype'] + else: + io_settings['dtype'] = data.dtype + if isinstance(io_settings['dtype'], str): + # map to real dtype if we were given a string + io_settings['dtype'] = cls.__dtypes.get(io_settings['dtype']) + try: + dset = parent.create_dataset(name, **io_settings) + dset.attrs['zarr_dtype'] = np.dtype(io_settings['dtype']).str + except Exception as exc: + raise Exception("Could not create dataset %s in %s" % (name, parent.name)) from exc + return dset + + @docval({'name': 'parent', 'type': Group, 'doc': 'the parent Zarr object'}, # noqa: C901 + {'name': 'builder', 'type': DatasetBuilder, 'doc': 'the DatasetBuilder to write'}, + {'name': 'link_data', 'type': bool, + 'doc': 'If not specified otherwise link (True) or copy (False) Zarr Datasets', 'default': True}, + {'name': 'exhaust_dci', 'type': bool, + 'doc': 'exhaust DataChunkIterators one at a time. 
If False, add ' + + 'them to the internal queue self.__dci_queue and exhaust them concurrently at the end', + 'default': True}, + {'name': 'force_data', 'type': None, + 'doc': 'Used internally to force the data being used when we have to load the data', 'default': None}, + {'name': 'export_source', 'type': str, + 'doc': 'The source of the builders when exporting', 'default': None}, + returns='the Zarr array that was created', rtype=Array) + def write_dataset(self, **kwargs): # noqa: C901 + parent, builder, link_data, exhaust_dci, export_source = getargs( + 'parent', 'builder', 'link_data', 'exhaust_dci', 'export_source', kwargs + ) + + force_data = getargs('force_data', kwargs) + + if exhaust_dci and self.__dci_queue is None: + self.__dci_queue = ZarrIODataChunkIteratorQueue() + + if self.get_written(builder): + return None + name = builder.name + data = builder.data if force_data is None else force_data + options = dict() + if isinstance(data, ZarrDataIO): + options['io_settings'] = data.io_settings + link_data = data.link_data + data = data.data + else: + options['io_settings'] = {} + + attributes = builder.attributes + options['dtype'] = builder.dtype + + linked = False + + # Write a regular Zarr array + dset = None + if isinstance(data, Array): + # copy the dataset + if link_data: + self.__add_link__(parent, data.store.path, data.name, name) + linked = True + dset = None + else: + zarr.copy(data, parent, name=name) + dset = parent[name] + # When converting data between backends we may see an HDMFDataset, e.g., a H55ReferenceDataset, with references + elif isinstance(data, HDMFDataset): + # If we have a dataset of containers we need to make the references to the containers + if len(data) > 0 and isinstance(data[0], Container): + ref_data = [self.__get_ref(data[i], export_source=export_source) for i in range(len(data))] + shape = (len(data), ) + type_str = 'object' + dset = parent.require_dataset(name, + shape=shape, + dtype=object, + object_codec=self.__codec_cls(), + **options['io_settings']) + dset.attrs['zarr_dtype'] = type_str + dset[:] = ref_data + self._written_builders.set_written(builder) # record that the builder has been written + # If we have a regular dataset, then load the data and write the builder after load + else: + # TODO This code path is also exercised when data is a + # hdmf.backends.hdf5.h5_utils.BuilderH5ReferenceDataset (aka. 
ReferenceResolver) + # check that this is indeed the right thing to do here + + # We can/should not update the data in the builder itself so we load the data here and instead + # force write_dataset when we call it recursively to use the data we loaded, rather than the + # dataset that is set on the builder + dset = self.write_dataset(parent=parent, + builder=builder, + link_data=link_data, + force_data=data[:], + export_source=export_source) + self._written_builders.set_written(builder) # record that the builder has been written + # Write a compound dataset + elif isinstance(options['dtype'], list): + refs = list() + type_str = list() + for i, dts in enumerate(options['dtype']): + if self.__is_ref(dts['dtype']): + refs.append(i) + ref_tmp = self.__get_ref(data[0][i], export_source=export_source) + if isinstance(ref_tmp, ZarrReference): + dts_str = 'object' + else: + dts_str = 'region' + type_str.append({'name': dts['name'], 'dtype': dts_str}) + else: + i = list([dts, ]) + t = self.__resolve_dtype_helper__(i) + type_str.append(self.__serial_dtype__(t)[0]) + + if len(refs) > 0: + dset = parent.require_dataset(name, + shape=(len(data), ), + dtype=object, + object_codec=self.__codec_cls(), + **options['io_settings']) + self._written_builders.set_written(builder) # record that the builder has been written + dset.attrs['zarr_dtype'] = type_str + for j, item in enumerate(data): + new_item = list(item) + for i in refs: + new_item[i] = self.__get_ref(item[i], export_source=export_source) + dset[j] = new_item + else: + # write a compound datatype + dset = self.__list_fill__(parent, name, data, options) + # Write a dataset of references + elif self.__is_ref(options['dtype']): + # TODO Region references are not yet support, but here how the code should look + # if isinstance(data, RegionBuilder): + # shape = (1,) + # type_str = 'region' + # refs = self.__get_ref(data.builder, data.region) + if isinstance(data, ReferenceBuilder): + shape = (1,) + type_str = 'object' + refs = self.__get_ref(data.builder, export_source=export_source) + # TODO: Region References are not yet supported + # elif options['dtype'] == 'region': + # shape = (len(data), ) + # type_str = 'region' + # refs = [self.__get_ref(item.builder, item.region) for item in data] + else: + shape = (len(data), ) + type_str = 'object' + refs = [self.__get_ref(item, export_source=export_source) for item in data] + + dset = parent.require_dataset(name, + shape=shape, + dtype=object, + object_codec=self.__codec_cls(), + **options['io_settings']) + self._written_builders.set_written(builder) # record that the builder has been written + dset.attrs['zarr_dtype'] = type_str + if hasattr(refs, '__len__'): + dset[:] = refs + else: + dset[0] = refs + # write a 'regular' dataset without DatasetIO info + else: + if isinstance(data, (str, bytes)): + dset = self.__scalar_fill__(parent, name, data, options) + # Iterative write of a data chunk iterator + elif isinstance(data, AbstractDataChunkIterator): + dset = self.__setup_chunked_dataset__(parent, name, data, options) + self.__dci_queue.append(dataset=dset, data=data) + elif hasattr(data, '__len__'): + dset = self.__list_fill__(parent, name, data, options) + else: + dset = self.__scalar_fill__(parent, name, data, options) + if not linked: + self.write_attributes(dset, attributes) + # record that the builder has been written + self._written_builders.set_written(builder) + # Exhaust the DataChunkIterator if the dataset was given this way. 
Note this is a no-op + # if the self.__dci_queue is empty + if exhaust_dci: + self.__dci_queue.exhaust_queue() + return dset + + __dtypes = { + "float": np.float32, + "float32": np.float32, + "double": np.float64, + "float64": np.float64, + "long": np.int64, + "int64": np.int64, + "uint64": np.uint64, + "int": np.int32, + "int32": np.int32, + "int16": np.int16, + "int8": np.int8, + "bool": np.bool_, + "bool_": np.bool_, + "text": str, + "utf": str, + "utf8": str, + "utf-8": str, + "ascii": bytes, + "str": str, + "isodatetime": str, + "string_": bytes, + "uint32": np.uint32, + "uint16": np.uint16, + "uint8": np.uint8, + "ref": ZarrReference, + "reference": ZarrReference, + "object": ZarrReference, + "region": ZarrReference, + } + + @classmethod + def __serial_dtype__(cls, dtype): + if isinstance(dtype, type): + return dtype.__name__ + elif isinstance(dtype, np.dtype): + if dtype.names is None: + return dtype.type.__name__ + else: + ret = list() + for n in dtype.names: + item = dict() + item['name'] = n + item['dtype'] = cls.__serial_dtype__(dtype[n]) + ret.append(item) + return ret + # TODO Does not work when Reference in compound datatype + elif dtype == ZarrReference: + return 'object' + + @classmethod + def __resolve_dtype__(cls, dtype, data): + dtype = cls.__resolve_dtype_helper__(dtype) + if dtype is None: + dtype = cls.get_type(data) + return dtype + + @classmethod + def __resolve_dtype_helper__(cls, dtype): + if dtype is None: + return None + elif isinstance(dtype, (type, np.dtype)): + return dtype + elif isinstance(dtype, str): + return cls.__dtypes.get(dtype) + elif isinstance(dtype, dict): + return cls.__dtypes.get(dtype['reftype']) + else: + return np.dtype([(x['name'], cls.__resolve_dtype_helper__(x['dtype'])) for x in dtype]) + + @classmethod + def get_type(cls, data): + if isinstance(data, str): + return str + elif not hasattr(data, '__len__'): + return type(data) + else: + if len(data) == 0: + raise ValueError('cannot determine type for empty data') + return cls.get_type(data[0]) + + __reserve_attribute = ('zarr_dtype', 'zarr_link') + + def __list_fill__(self, parent, name, data, options=None): # noqa: C901 + dtype = None + io_settings = dict() + if options is not None: + dtype = options.get('dtype') + io_settings = options.get('io_settings') + if io_settings is None: + io_settings = dict() + # Determine the dtype + if not isinstance(dtype, type): + try: + dtype = self.__resolve_dtype__(dtype, data) + except Exception as exc: + msg = 'cannot add %s to %s - could not determine type' % (name, parent.name) # noqa: F821 + raise Exception(msg) from exc + + # Set the type_str + type_str = self.__serial_dtype__(dtype) + + # Determine the shape and update the dtype if necessary when dtype==object + if 'shape' in io_settings: # Use the shape set by the user + data_shape = io_settings.pop('shape') + # If we have a numeric numpy array then use its shape + elif isinstance(dtype, np.dtype) and np.issubdtype(dtype, np.number) or dtype == np.bool_: + data_shape = get_data_shape(data) + # Deal with object dtype + elif isinstance(dtype, np.dtype): + data = data[:] # load the data in case we come from HDF5 or another on-disk data source we don't know + data_shape = (len(data), ) + # if we have a compound data type + if dtype.names: + data_shape = get_data_shape(data) + # If strings are part of our compound type then we need to use Object type instead + # otherwise we try to keep the native compound datatype that numpy is using + for substype in dtype.fields.items(): + if 
np.issubdtype(substype[1][0], np.flexible) or np.issubdtype(substype[1][0], np.object_): + dtype = object + io_settings['object_codec'] = self.__codec_cls() + break + # sometimes bytes and strings can hide as object in numpy array so lets try + # to write those as strings and bytes rather than as objects + elif len(data) > 0 and isinstance(data, np.ndarray): + if isinstance(data.item(0), bytes): + dtype = bytes + data_shape = get_data_shape(data) + elif isinstance(data.item(0), str): + dtype = str + data_shape = get_data_shape(data) + # Set encoding for objects + else: + dtype = object + io_settings['object_codec'] = self.__codec_cls() + # Determine the shape from the data if all other cases have not been hit + else: + data_shape = get_data_shape(data) + + # Create the dataset + dset = parent.require_dataset(name, shape=data_shape, dtype=dtype, **io_settings) + dset.attrs['zarr_dtype'] = type_str + + # Write the data to file + if dtype == object: + for c in np.ndindex(data_shape): + o = data + for i in c: + o = o[i] + # bytes are not JSON serializable + dset[c] = o if not isinstance(o, (bytes, np.bytes_)) else o.decode("utf-8") + return dset + # standard write + else: + try: + dset[:] = data # If data is an h5py.Dataset then this will copy the data + # For compound data types containing strings Zarr sometimes does not like wirting multiple values + # try to write them one-at-a-time instead then + except ValueError: + for i in range(len(data)): + dset[i] = data[i] + return dset + + def __scalar_fill__(self, parent, name, data, options=None): + dtype = None + io_settings = dict() + if options is not None: + dtype = options.get('dtype') + io_settings = options.get('io_settings') + if io_settings is None: + io_settings = dict() + if not isinstance(dtype, type): + try: + dtype = self.__resolve_dtype__(dtype, data) + except Exception as exc: + msg = 'cannot add %s to %s - could not determine type' % (name, parent.name) + raise Exception(msg) from exc + if dtype == object: + io_settings['object_codec'] = self.__codec_cls() + + dset = parent.require_dataset(name, shape=(1, ), dtype=dtype, **io_settings) + dset[:] = data + type_str = 'scalar' + dset.attrs['zarr_dtype'] = type_str + return dset + + @docval(returns='a GroupBuilder representing the NWB Dataset', rtype='GroupBuilder') + def read_builder(self): + f_builder = self.__read_group(self.__file, ROOT_NAME) + return f_builder + + def __set_built(self, zarr_obj, builder): + fpath = zarr_obj.store.path + path = zarr_obj.path + path = os.path.join(fpath, path) + self.__built.setdefault(path, builder) + + @docval({'name': 'zarr_obj', 'type': (Array, Group), + 'doc': 'the Zarr object to the corresponding Container/Data object for'}) + def get_container(self, **kwargs): + """ + Get the container for the corresponding Zarr Group or Dataset + + :raises ValueError: When no builder has been constructed yet for the given h5py object + """ + zarr_obj = getargs('zarr_obj', kwargs) + builder = self.get_builder(zarr_obj) + container = self.manager.construct(builder) + return container # TODO: This method should be moved to HDMFIO + + @docval({'name': 'zarr_obj', 'type': (Array, Group), + 'doc': 'the Zarr object to the corresponding Builder object for'}) + def get_builder(self, **kwargs): # TODO: move this to HDMFIO (define skeleton in there at least) + """ + Get the builder for the corresponding Group or Dataset + + :raises ValueError: When no builder has been constructed + """ + zarr_obj = kwargs['zarr_obj'] + builder = self.__get_built(zarr_obj) + if 
builder is None: + msg = '%s has not been built' % (zarr_obj.name) + raise ValueError(msg) + return builder + + def __get_built(self, zarr_obj): + """ + Look up a builder for the given zarr object + :param zarr_obj: The Zarr object to be built + :type zarr_obj: Zarr Group or Dataset + :return: Builder in the self.__built cache or None + """ + fpath = zarr_obj.store.path + path = zarr_obj.path + path = os.path.join(fpath, path) + return self.__built.get(path, None) + + def __read_group(self, zarr_obj, name=None): + ret = self.__get_built(zarr_obj) + if ret is not None: + return ret + + if name is None: + name = str(os.path.basename(zarr_obj.name)) + + # Create the GroupBuilder + attributes = self.__read_attrs(zarr_obj) + ret = GroupBuilder(name=name, source=self.source, attributes=attributes) + ret.location = self.get_zarr_parent_path(zarr_obj) + + # read sub groups + for sub_name, sub_group in zarr_obj.groups(): + sub_builder = self.__read_group(sub_group, sub_name) + ret.set_group(sub_builder) + + # read sub datasets + for sub_name, sub_array in zarr_obj.arrays(): + sub_builder = self.__read_dataset(sub_array, sub_name) + ret.set_dataset(sub_builder) + + # read the links + self.__read_links(zarr_obj=zarr_obj, parent=ret) + + self._written_builders.set_written(ret) # record that the builder has been written + self.__set_built(zarr_obj, ret) + return ret + + def __read_links(self, zarr_obj, parent): + """ + Read the links associated with a zarr group + :param zarr_obj: The Zarr group we should read links from + :type zarr_obj: zarr.hierarchy.Group + :param parent: GroupBuilder with which the links need to be associated + :type parent: GroupBuilder + """ + # read links + if 'zarr_link' in zarr_obj.attrs: + links = zarr_obj.attrs['zarr_link'] + for link in links: + link_name = link['name'] + target_name, target_zarr_obj = self.resolve_ref(link) + # NOTE: __read_group and __read_dataset return the cached builders if the target has already been built + if isinstance(target_zarr_obj, Group): + builder = self.__read_group(target_zarr_obj, target_name) + else: + builder = self.__read_dataset(target_zarr_obj, target_name) + link_builder = LinkBuilder(builder=builder, name=link_name, source=self.source) + link_builder.location = os.path.join(parent.location, parent.name) + self._written_builders.set_written(link_builder) # record that the builder has been written + parent.set_link(link_builder) + + def __read_dataset(self, zarr_obj, name): + ret = self.__get_built(zarr_obj) + if ret is not None: + return ret + + if 'zarr_dtype' in zarr_obj.attrs: + zarr_dtype = zarr_obj.attrs['zarr_dtype'] + elif hasattr(zarr_obj, 'dtype'): # Fallback for invalid files that are missing zarr_dtype + zarr_dtype = zarr_obj.dtype + warnings.warn( + "Inferred dtype from zarr type.
Dataset missing zarr_dtype: " + str(name) + " " + str(zarr_obj) + ) + else: + raise ValueError("Dataset missing zarr_dtype: " + str(name) + " " + str(zarr_obj)) + + kwargs = {"attributes": self.__read_attrs(zarr_obj), + "dtype": zarr_dtype, + "maxshape": zarr_obj.shape, + "chunks": not (zarr_obj.shape == zarr_obj.chunks), + "source": self.source} + dtype = kwargs['dtype'] + + # By default, use the zarr.core.Array as data for lazy data load + data = zarr_obj + + # Read scalar dataset + if dtype == 'scalar': + data = zarr_obj[0] + + if isinstance(dtype, list): + # Check compound dataset where one of the subsets contains references + has_reference = False + for i, dts in enumerate(dtype): + if dts['dtype'] in ['object', 'region']: # check items for object reference + has_reference = True + break + retrieved_dtypes = [dtype_dict['dtype'] for dtype_dict in dtype] + if has_reference: + # TODO: BuilderZarrTableDataset does not yet support region reference + data = BuilderZarrTableDataset(zarr_obj, self, retrieved_dtypes) + elif self.__is_ref(dtype): + # Array of references + if dtype == 'object': + data = BuilderZarrReferenceDataset(data, self) + # TODO: Resolution of Region reference not yet supported by BuilderZarrRegionDataset + # elif dtype == 'region': + # data = BuilderZarrRegionDataset(data, self) + + kwargs['data'] = data + if name is None: + name = str(os.path.basename(zarr_obj.name)) + ret = DatasetBuilder(name, **kwargs) # create builder object for dataset + ret.location = self.get_zarr_parent_path(zarr_obj) + self._written_builders.set_written(ret) # record that the builder has been written + self.__set_built(zarr_obj, ret) + return ret + + def __read_attrs(self, zarr_obj): + ret = dict() + for k in zarr_obj.attrs.keys(): + if k not in self.__reserve_attribute: + v = zarr_obj.attrs[k] + if isinstance(v, dict) and 'zarr_dtype' in v: + if v['zarr_dtype'] == 'object': + target_name, target_zarr_obj = self.resolve_ref(v['value']) + if isinstance(target_zarr_obj, zarr.hierarchy.Group): + ret[k] = self.__read_group(target_zarr_obj, target_name) + else: + ret[k] = self.__read_dataset(target_zarr_obj, target_name) + # TODO Need to implement region references for attributes + elif v['zarr_dtype'] == 'region': + raise NotImplementedError("Read of region references from attributes not implemented in ZarrIO") + else: + raise NotImplementedError("Unsupported zarr_dtype for attribute " + str(v)) + else: + ret[k] = v + return ret
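
For reference, the consolidated-metadata round trip that the new open and write paths build on can be exercised with plain Zarr as shown in the minimal sketch below. It is illustrative only and not part of this change; the 'example.zarr' path and the 'data' array name are hypothetical.

import zarr

# Write a small store, then consolidate all group/array metadata into '.zmetadata'
root = zarr.open('example.zarr', mode='w')
root.create_dataset('data', data=[1, 2, 3], chunks=(3,))
zarr.consolidate_metadata('example.zarr', metadata_key='.zmetadata')

# Re-opening through the consolidated metadata replaces many small metadata reads
# with a single read of '.zmetadata', which is what __open_file_consolidated relies on
f = zarr.open_consolidated(store='example.zarr', mode='r')
print(f['data'][:])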