Commit 7e2768a

make shard_format configurable, add bitmask for uncompressed chunks
1 parent 97a9368 commit 7e2768a

6 files changed, +107 −52 lines changed

chunking_test.py

Lines changed: 5 additions & 4 deletions
@@ -4,17 +4,18 @@
 import zarr
 
 store = zarr.DirectoryStore("data/chunking_test.zarr")
-z = zarr.zeros((20, 3), chunks=(3, 3), shards=(2, 2), store=store, overwrite=True, compressor=None)
-z[...] = 42
+z = zarr.zeros((20, 3), chunks=(3, 2), shards=(2, 2), store=store, overwrite=True, compressor=None)
+z[:10, :] = 42
 z[15, 1] = 389
 z[19, 2] = 1
 z[0, 1] = -4.2
 
+print(store[".zarray"].decode())
 print("ONDISK", sorted(os.listdir("data/chunking_test.zarr")))
 assert json.loads(store[".zarray"].decode())["shards"] == [2, 2]
 
-print("STORE", list(store))
-print("CHUNKSTORE (SHARDED)", list(z.chunk_store))
+print("STORE", sorted(store))
+print("CHUNKSTORE (SHARDED)", sorted(z.chunk_store))
 
 z_reopened = zarr.open("data/chunking_test.zarr")
 assert z_reopened.shards == (2, 2)

zarr/_storage/sharded_store.py

Lines changed: 81 additions & 38 deletions
@@ -1,6 +1,7 @@
+from collections import defaultdict
 from functools import reduce
-from itertools import product
-from typing import Any, Iterable, Iterator, Optional, Tuple
+import math
+from typing import Any, Dict, Iterable, Iterator, List, Tuple, Union
 
 import numpy as np
 
@@ -16,7 +17,7 @@ def _cum_prod(x: Iterable[int]) -> Iterable[int]:
         yield prod
 
 
-class ShardedStore(Store):
+class MortonOrderShardedStore(Store):
     """This class should not be used directly,
     but is added to an Array as a wrapper when needed automatically."""
 
@@ -32,59 +33,97 @@ def __init__(
     ) -> None:
         self._store: BaseStore = BaseStore._ensure_store(store)
         self._shards = shards
-        # This defines C/F-order
-        self._shard_strides = tuple(_cum_prod(shards))
         self._num_chunks_per_shard = reduce(lambda x, y: x*y, shards, 1)
         self._dimension_separator = dimension_separator
-        # TODO: add jumptable for compressed data
+
         chunk_has_constant_size = not are_chunks_compressed and not dtype == object
         assert chunk_has_constant_size, "Currently only uncompressed, fixed-length data can be used."
         self._chunk_has_constant_size = chunk_has_constant_size
         if chunk_has_constant_size:
             binary_fill_value = np.full(1, fill_value=fill_value or 0, dtype=dtype).tobytes()
             self._fill_chunk = binary_fill_value * chunk_size
-        else:
-            self._fill_chunk = None
+        self._emtpy_meta = b"\x00" * math.ceil(self._num_chunks_per_shard / 8)
+
+        # unused when using Morton order
+        self._shard_strides = tuple(_cum_prod(shards))
 
         # TODO: add warnings for ineffective reads/writes:
         # * warn if partial reads are not available
         # * optionally warn on unaligned writes if no partial writes are available
-
-    def __key_to_sharded__(self, key: str) -> Tuple[str, int]:
+
+    def __get_meta__(self, shard_content: Union[bytes, bytearray]) -> int:
+        return int.from_bytes(shard_content[-len(self._emtpy_meta):], byteorder="big")
+
+    def __set_meta__(self, shard_content: bytearray, meta: int) -> None:
+        shard_content[-len(self._emtpy_meta):] = meta.to_bytes(len(self._emtpy_meta), byteorder="big")
+
+    # The following two methods define the order of the chunks in a shard
+    # TODO use morton order
+    def __chunk_key_to_shard_key_and_index__(self, chunk_key: str) -> Tuple[str, int]:
         # TODO: allow to be in a group (aka only use last parts for dimensions)
-        subkeys = map(int, key.split(self._dimension_separator))
+        chunk_subkeys = map(int, chunk_key.split(self._dimension_separator))
 
-        shard_tuple, index_tuple = zip(*((subkey // shard_i, subkey % shard_i) for subkey, shard_i in zip(subkeys, self._shards)))
+        shard_tuple, index_tuple = zip(*((subkey // shard_i, subkey % shard_i) for subkey, shard_i in zip(chunk_subkeys, self._shards)))
         shard_key = self._dimension_separator.join(map(str, shard_tuple))
         index = sum(i * j for i, j in zip(index_tuple, self._shard_strides))
         return shard_key, index
 
-    def __get_chunk_slice__(self, shard_key: str, shard_index: int) -> Tuple[int, int]:
-        # TODO: here we would use the jumptable for compression, which uses shard_key
+    def __shard_key_and_index_to_chunk_key__(self, shard_key_tuple: Tuple[int, ...], shard_index: int) -> str:
+        offset = tuple(shard_index % s2 // s1 for s1, s2 in zip(self._shard_strides, self._shard_strides[1:] + (self._num_chunks_per_shard,)))
+        original_key = (shard_key_i * shards_i + offset_i for shard_key_i, offset_i, shards_i in zip(shard_key_tuple, offset, self._shards))
+        return self._dimension_separator.join(map(str, original_key))
+
+    def __keys_to_shard_groups__(self, keys: Iterable[str]) -> Dict[str, List[Tuple[str, str]]]:
+        shard_indices_per_shard_key = defaultdict(list)
+        for chunk_key in keys:
+            shard_key, shard_index = self.__chunk_key_to_shard_key_and_index__(chunk_key)
+            shard_indices_per_shard_key[shard_key].append((shard_index, chunk_key))
+        return shard_indices_per_shard_key
+
+    def __get_chunk_slice__(self, shard_index: int) -> Tuple[int, int]:
        start = shard_index * len(self._fill_chunk)
        return slice(start, start + len(self._fill_chunk))
 
     def __getitem__(self, key: str) -> bytes:
-        shard_key, shard_index = self.__key_to_sharded__(key)
-        chunk_slice = self.__get_chunk_slice__(shard_key, shard_index)
-        # TODO use partial reads if available
-        full_shard_value = self._store[shard_key]
-        return full_shard_value[chunk_slice]
+        return self.getitems([key])[key]
+
+    def getitems(self, keys: Iterable[str], **kwargs) -> Dict[str, bytes]:
+        result = {}
+        for shard_key, chunks_in_shard in self.__keys_to_shard_groups__(keys).items():
+            # TODO use partial reads if available
+            full_shard_value = self._store[shard_key]
+            # TODO omit items if they don't exist
+            for shard_index, chunk_key in chunks_in_shard:
+                result[chunk_key] = full_shard_value[self.__get_chunk_slice__(shard_index)]
+        return result
 
     def __setitem__(self, key: str, value: bytes) -> None:
-        shard_key, shard_index = self.__key_to_sharded__(key)
-        if shard_key in self._store:
-            full_shard_value = bytearray(self._store[shard_key])
-        else:
-            full_shard_value = bytearray(self._fill_chunk * self._num_chunks_per_shard)
-        chunk_slice = self.__get_chunk_slice__(shard_key, shard_index)
-        # TODO use partial writes if available
-        full_shard_value[chunk_slice] = value
-        self._store[shard_key] = full_shard_value
+        self.setitems({key: value})
+
+    def setitems(self, values: Dict[str, bytes]) -> None:
+        for shard_key, chunks_in_shard in self.__keys_to_shard_groups__(values.keys()).items():
+            if len(chunks_in_shard) == self._num_chunks_per_shard:
+                # TODO shards at a non-dataset-size aligned surface are not captured here yet
+                full_shard_value = b"".join(
+                    values[chunk_key] for _, chunk_key in sorted(chunks_in_shard)
+                ) + b"\xff" * len(self._emtpy_meta)
+                self._store[shard_key] = full_shard_value
+            else:
+                # TODO use partial writes if available
+                try:
+                    full_shard_value = bytearray(self._store[shard_key])
+                except KeyError:
+                    full_shard_value = bytearray(self._fill_chunk * self._num_chunks_per_shard + self._emtpy_meta)
+                chunk_mask = self.__get_meta__(full_shard_value)
+                for shard_index, chunk_key in chunks_in_shard:
+                    chunk_mask |= 1 << shard_index
+                    full_shard_value[self.__get_chunk_slice__(shard_index)] = values[chunk_key]
+                self.__set_meta__(full_shard_value, chunk_mask)
+                self._store[shard_key] = full_shard_value
 
     def __delitem__(self, key) -> None:
-        # TODO not implemented yet
-        # For uncompressed chunks, deleting the "last" chunk might need to be detected.
+        # TODO not implemented yet, also delitems
+        # Deleting the "last" chunk in a shard needs to remove the whole shard
         raise NotImplementedError("Deletion is not yet implemented")
 
     def __iter__(self) -> Iterator[str]:
@@ -94,16 +133,20 @@ def __iter__(self) -> Iterator[str]:
                 yield shard_key
             else:
                 # For each shard key in the wrapped store, all corresponding chunks are yielded.
-                # TODO: For compressed chunks we might yield only the actualy contained chunks by reading the jumptables.
                 # TODO: allow to be in a group (aka only use last parts for dimensions)
-                subkeys = tuple(map(int, shard_key.split(self._dimension_separator)))
-                for offset in product(*(range(i) for i in self._shards)):
-                    original_key = (subkeys_i * shards_i + offset_i for subkeys_i, offset_i, shards_i in zip(subkeys, offset, self._shards))
-                    yield self._dimension_separator.join(map(str, original_key))
+                shard_key_tuple = tuple(map(int, shard_key.split(self._dimension_separator)))
+                mask = self.__get_meta__(self._store[shard_key])
+                for i in range(self._num_chunks_per_shard):
+                    if mask == 0:
+                        break
+                    if mask & 1:
+                        yield self.__shard_key_and_index_to_chunk_key__(shard_key_tuple, i)
+                    mask >>= 1
 
     def __len__(self) -> int:
         return sum(1 for _ in self.keys())
 
-    # TODO: For efficient reads and writes, we need to implement
-    # getitems, setitems & delitems
-    # and combine writes/reads/deletions to the same shard.
+
+SHARDED_STORES = {
+    "morton_order": MortonOrderShardedStore,
+}
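
For orientation, a minimal standalone sketch of the chunk-key arithmetic and the new trailing bitmask (illustration only, not part of the commit). It assumes the default "." dimension separator and that _cum_prod yields the strides (1, 2) for shards=(2, 2); the helper name below is made up and rephrases __chunk_key_to_shard_key_and_index__ and __get_meta__.

import math

shards = (2, 2)                                   # chunks per shard along each dimension
dimension_separator = "."                         # assumed default
num_chunks_per_shard = shards[0] * shards[1]      # 4
strides = (1, shards[0])                          # assumed output of _cum_prod(shards)
meta_size = math.ceil(num_chunks_per_shard / 8)   # 1 bitmask byte appended to each shard

def chunk_key_to_shard_key_and_index(chunk_key):
    # mirrors MortonOrderShardedStore.__chunk_key_to_shard_key_and_index__
    subkeys = tuple(map(int, chunk_key.split(dimension_separator)))
    shard_tuple = tuple(k // s for k, s in zip(subkeys, shards))
    index_tuple = tuple(k % s for k, s in zip(subkeys, shards))
    shard_key = dimension_separator.join(map(str, shard_tuple))
    return shard_key, sum(i * j for i, j in zip(index_tuple, strides))

print(chunk_key_to_shard_key_and_index("5.1"))    # ('2.0', 3): chunk (5, 1) is slot 3 of shard "2.0"

# The last meta_size bytes of a stored shard record which chunk slots hold written data:
# bit i set <=> chunk slot i was written (setitems sets all bits for a fully written shard).
mask = int.from_bytes(bytes([0b00001001]), byteorder="big")
present = [i for i in range(num_chunks_per_shard) if (mask >> i) & 1]
print(present)                                    # [0, 3]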

zarr/core.py

Lines changed: 8 additions & 6 deletions
@@ -11,7 +11,7 @@
 from numcodecs.compat import ensure_bytes, ensure_ndarray
 
 from collections.abc import MutableMapping
-from zarr._storage.sharded_store import ShardedStore
+from zarr._storage.sharded_store import SHARDED_STORES
 
 from zarr.attrs import Attributes
 from zarr.codecs import AsType, get_codec
@@ -219,6 +219,7 @@ def _load_metadata_nosync(self):
         self._shape = meta['shape']
         self._chunks = meta['chunks']
         self._shards = meta.get('shards')
+        self._shard_format = meta.get('shard_format')
         self._dtype = meta['dtype']
         self._fill_value = meta['fill_value']
         self._order = meta['order']
@@ -272,7 +273,8 @@ def _flush_metadata_nosync(self):
         # should the dimension_separator also be included in this dict?
         meta = dict(shape=self._shape, chunks=self._chunks, dtype=self._dtype,
                     compressor=compressor_config, fill_value=self._fill_value,
-                    order=self._order, filters=filters_config, shards=self._shards)
+                    order=self._order, filters=filters_config,
+                    shards=self._shards, shard_format=self._shard_format)
         mkey = self._key_prefix + array_meta_key
         self._store[mkey] = self._store._metadata_class.encode_array_metadata(meta)
 
@@ -324,7 +326,7 @@ def chunk_store(self):
             return chunk_store
         else:
             if self._cached_sharded_store is None:
-                self._cached_sharded_store = ShardedStore(
+                self._cached_sharded_store = SHARDED_STORES[self._shard_format](
                     chunk_store,
                     shards=self._shards,
                     dimension_separator=self._dimension_separator,
@@ -1731,7 +1733,7 @@ def _set_selection(self, indexer, value, fields=None):
         check_array_shape('value', value, sel_shape)
 
         # iterate over chunks in range
-        if not hasattr(self.store, "setitems") or self._synchronizer is not None \
+        if not hasattr(self.chunk_store, "setitems") or self._synchronizer is not None \
                 or any(map(lambda x: x == 0, self.shape)):
             # iterative approach
             for chunk_coords, chunk_selection, out_selection in indexer:
@@ -1974,8 +1976,8 @@ def _chunk_setitems(self, lchunk_coords, lchunk_selection, values, fields=None):
         self.chunk_store.setitems(to_store)
 
     def _chunk_delitems(self, ckeys):
-        if hasattr(self.store, "delitems"):
-            self.store.delitems(ckeys)
+        if hasattr(self.chunk_store, "delitems"):
+            self.chunk_store.delitems(ckeys)
         else:  # pragma: no cover
             # exempting this branch from coverage as there are no extant stores
             # that will trigger this condition, but it's possible that they
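
Array.chunk_store now resolves the wrapper class through the SHARDED_STORES registry keyed by shard_format. A hypothetical sketch of plugging in another format follows; the "custom_order" name and CustomOrderShardedStore class are made up, and only "morton_order" exists in this commit.

from zarr._storage.sharded_store import SHARDED_STORES, MortonOrderShardedStore

class CustomOrderShardedStore(MortonOrderShardedStore):
    """Hypothetical variant that would override the two key-ordering hooks
    (__chunk_key_to_shard_key_and_index__ / __shard_key_and_index_to_chunk_key__)
    to lay chunks out differently inside a shard."""

SHARDED_STORES["custom_order"] = CustomOrderShardedStore

# Array.chunk_store then instantiates the wrapper roughly as:
#     SHARDED_STORES[self._shard_format](chunk_store, shards=..., dimension_separator=..., ...)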

zarr/creation.py

Lines changed: 2 additions & 2 deletions
@@ -21,7 +21,7 @@ def create(shape, chunks=True, dtype=None, compressor='default',
            overwrite=False, path=None, chunk_store=None, filters=None,
            cache_metadata=True, cache_attrs=True, read_only=False,
            object_codec=None, dimension_separator=None, write_empty_chunks=True,
-           shards: Union[int, Tuple[int, ...], None]=None, **kwargs):
+           shards: Union[int, Tuple[int, ...], None]=None, shard_format: str="morton_order", **kwargs):
     """Create an array.
 
     Parameters
@@ -147,7 +147,7 @@ def create(shape, chunks=True, dtype=None, compressor='default',
     init_array(store, shape=shape, chunks=chunks, dtype=dtype, compressor=compressor,
                fill_value=fill_value, order=order, overwrite=overwrite, path=path,
                chunk_store=chunk_store, filters=filters, object_codec=object_codec,
-               dimension_separator=dimension_separator, shards=shards)
+               dimension_separator=dimension_separator, shards=shards, shard_format=shard_format)
 
     # instantiate array
     z = Array(store, path=path, chunk_store=chunk_store, synchronizer=synchronizer,
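
A usage sketch of the new keyword, following chunking_test.py (illustration only, not part of the commit). It assumes zarr.zeros forwards keyword arguments to create as usual; shard_format defaults to "morton_order", so spelling it out is optional, and the store path is made up.

import zarr

store = zarr.DirectoryStore("data/example.zarr")
z = zarr.zeros((20, 3), chunks=(3, 2), shards=(2, 2), shard_format="morton_order",
               store=store, overwrite=True, compressor=None)
z[:10, :] = 42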

zarr/meta.py

Lines changed: 6 additions & 1 deletion
@@ -52,6 +52,7 @@ def decode_array_metadata(cls, s: Union[MappingType, str]) -> MappingType[str, A
 
             dimension_separator = meta.get("dimension_separator", None)
             shards = meta.get("shards", None)
+            shard_format = meta.get("shard_format", None)
             fill_value = cls.decode_fill_value(meta['fill_value'], dtype, object_codec)
             meta = dict(
                 zarr_format=meta["zarr_format"],
@@ -67,6 +68,8 @@ def decode_array_metadata(cls, s: Union[MappingType, str]) -> MappingType[str, A
                 meta['dimension_separator'] = dimension_separator
             if shards:
                 meta['shards'] = tuple(shards)
+                assert shard_format is not None
+                meta['shard_format'] = shard_format
         except Exception as e:
             raise MetadataError("error decoding metadata") from e
         else:
@@ -81,6 +84,7 @@ def encode_array_metadata(cls, meta: MappingType[str, Any]) -> bytes:
 
         dimension_separator = meta.get("dimension_separator")
         shards = meta.get("shards")
+        shard_format = meta.get("shard_format")
        if dtype.hasobject:
            import numcodecs
            object_codec = numcodecs.get_codec(meta['filters'][0])
@@ -99,9 +103,10 @@ def encode_array_metadata(cls, meta: MappingType[str, Any]) -> bytes:
         )
         if dimension_separator:
             meta['dimension_separator'] = dimension_separator
-
         if shards:
             meta['shards'] = shards
+            assert shard_format is not None
+            meta['shard_format'] = shard_format
 
         return json_dumps(meta)
 
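
Continuing the usage sketch above: with these metadata changes, the encoded .zarray carries both new keys (a sketch; the remaining fields and their exact order are omitted).

import json

meta = json.loads(store[".zarray"].decode())
assert meta["shards"] == [2, 2]
assert meta["shard_format"] == "morton_order"  # default written by _init_array_metadata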

zarr/storage.py

Lines changed: 5 additions & 1 deletion
@@ -237,6 +237,7 @@ def init_array(
         object_codec=None,
         dimension_separator=None,
         shards: Union[int, Tuple[int, ...], None]=None,
+        shard_format: Optional[str]=None,
 ):
     """Initialize an array store with the given configuration. Note that this is a low-level
     function and there should be no need to call this directly from user code.
@@ -355,7 +356,7 @@ def init_array(
                          chunk_store=chunk_store, filters=filters,
                          object_codec=object_codec,
                          dimension_separator=dimension_separator,
-                         shards=shards)
+                         shards=shards, shard_format=shard_format)
 
 
 def _init_array_metadata(
@@ -373,6 +374,7 @@ def _init_array_metadata(
         object_codec=None,
         dimension_separator=None,
         shards:Union[int, Tuple[int, ...], None] = None,
+        shard_format: Optional[str]=None,
 ):
 
     # guard conditions
@@ -392,6 +394,7 @@
         dtype = dtype.base
     chunks = normalize_chunks(chunks, shape, dtype.itemsize)
     shards = normalize_shards(shards, shape)
+    shard_format = shard_format or "morton_order"
     order = normalize_order(order)
     fill_value = normalize_fill_value(fill_value, dtype)
 
@@ -451,6 +454,7 @@
                 dimension_separator=dimension_separator)
     if shards is not None:
         meta["shards"] = shards
+        meta["shard_format"] = shard_format
     key = _path_to_prefix(path) + array_meta_key
     if hasattr(store, '_metadata_class'):
         store[key] = store._metadata_class.encode_array_metadata(meta)  # type: ignore
