Skip to content

experimental

Experimental functionality is not stable and may change or be removed at any point.

Classes

zarr.experimental.cache_store

logger module-attribute

logger = getLogger(__name__)

CacheStore

Bases: WrapperStore[Store]

A dual-store caching implementation for Zarr stores.

This cache wraps any Store implementation and uses a separate Store instance as the cache backend. This provides persistent caching capabilities with time-based expiration, size-based eviction, and flexible cache storage options.

Full-key reads are cached in the Store-backed cache. Byte-range reads are cached in a separate in-memory dictionary so that partial reads never pollute the filesystem (or other persistent backend). Both caches share the same max_size budget and LRU eviction policy.

Parameters:

  • store (Store) –

    The underlying store to wrap with caching

  • cache_store (Store) –

    The store to use for caching (can be any Store implementation)

  • max_age_seconds (int | str, default: 'infinity' ) –

    Maximum age of cached entries in seconds. The string 'infinity' means no expiration. Default is 'infinity'.

  • max_size (int | None, default: None ) –

    Maximum size of the cache in bytes. When exceeded, least recently used items are evicted. None means unlimited size. Default is None. Note: Individual values larger than max_size will not be cached.

  • cache_set_data (bool, default: True ) –

    Whether to cache data when it's written to the store. Default is True.

Examples:

import zarr
from zarr.storage import MemoryStore
from zarr.experimental.cache_store import CacheStore

# Create a cached store
source_store = MemoryStore()
cache_store = MemoryStore()
cached_store = CacheStore(
    store=source_store,
    cache_store=cache_store,
    max_age_seconds=60,
    max_size=1024*1024
)

# Use it like any other store
array = zarr.create(shape=(100,), store=cached_store)
array[:] = 42
Source code in zarr/experimental/cache_store.py
 37
 38
 39
 40
 41
 42
 43
 44
 45
 46
 47
 48
 49
 50
 51
 52
 53
 54
 55
 56
 57
 58
 59
 60
 61
 62
 63
 64
 65
 66
 67
 68
 69
 70
 71
 72
 73
 74
 75
 76
 77
 78
 79
 80
 81
 82
 83
 84
 85
 86
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
class CacheStore(WrapperStore[Store]):
    """
    A dual-store caching implementation for Zarr stores.

    This cache wraps any Store implementation and uses a separate Store instance
    as the cache backend. This provides persistent caching capabilities with
    time-based expiration, size-based eviction, and flexible cache storage options.

    Full-key reads are cached in the Store-backed cache.  Byte-range reads are
    cached in a separate in-memory dictionary so that partial reads never
    pollute the filesystem (or other persistent backend).  Both caches share
    the same ``max_size`` budget and LRU eviction policy.

    Parameters
    ----------
    store : Store
        The underlying store to wrap with caching
    cache_store : Store
        The store to use for caching (can be any Store implementation)
    max_age_seconds : int | str, optional
        Maximum age of cached entries in seconds. The string ``"infinity"``
        means entries never expire. Default is ``"infinity"``.
    max_size : int | None, optional
        Maximum size of the cache in bytes. When exceeded, least recently used
        items are evicted. None means unlimited size. Default is None.
        Note: Individual values larger than max_size will not be cached.
    cache_set_data : bool, optional
        Whether to cache data when it's written to the store. Default is True.

    Examples
    --------
    ```python
    import zarr
    from zarr.storage import MemoryStore
    from zarr.experimental.cache_store import CacheStore

    # Create a cached store
    source_store = MemoryStore()
    cache_store = MemoryStore()
    cached_store = CacheStore(
        store=source_store,
        cache_store=cache_store,
        max_age_seconds=60,
        max_size=1024*1024
    )

    # Use it like any other store
    array = zarr.create(shape=(100,), store=cached_store)
    array[:] = 42
    ```

    """

    # Store-backed cache used for full-key reads/writes.
    _cache: Store
    # Entry lifetime in seconds; the sentinel "infinity" disables expiration.
    max_age_seconds: int | Literal["infinity"]
    # Shared byte budget for both caches; None means unbounded.
    max_size: int | None
    # True: set() writes through to the cache; False: set() invalidates it.
    cache_set_data: bool
    # Mutable bookkeeping (LRU order, sizes, timestamps, stats, lock) —
    # deliberately shared between views created via with_read_only().
    _state: _CacheState

    def __init__(
        self,
        store: Store,
        *,
        cache_store: Store,
        max_age_seconds: int | str = "infinity",
        max_size: int | None = None,
        cache_set_data: bool = True,
    ) -> None:
        super().__init__(store)

        # Eviction and invalidation require deleting keys from the cache
        # store, so a delete-less backend cannot be used as the cache.
        if not cache_store.supports_deletes:
            msg = (
                f"The provided cache store {cache_store} does not support deletes. "
                "The cache_store must support deletes for CacheStore to function properly."
            )
            raise ValueError(msg)

        self._cache = cache_store
        # Validate and set max_age_seconds: the only accepted string is the
        # "infinity" sentinel; any int is taken as a lifetime in seconds.
        if isinstance(max_age_seconds, str):
            if max_age_seconds != "infinity":
                raise ValueError("max_age_seconds string value must be 'infinity'")
            self.max_age_seconds = "infinity"
        else:
            self.max_age_seconds = max_age_seconds
        self.max_size = max_size
        self.cache_set_data = cache_set_data
        self._state = _CacheState()

    def _with_store(self, store: Store) -> Self:
        # Cannot support this operation because it would share a cache, but have a new store
        # So cache keys would conflict
        raise NotImplementedError("CacheStore does not support this operation.")

    def with_read_only(self, read_only: bool = False) -> Self:
        """Return a view of this cache store with the given read-only setting.

        The returned store shares the same cache backend and the same mutable
        ``_state`` (LRU order, sizes, statistics), so both views stay coherent.
        """
        store = type(self)(
            store=self._store.with_read_only(read_only),
            cache_store=self._cache,
            max_age_seconds=self.max_age_seconds,
            max_size=self.max_size,
            cache_set_data=self.cache_set_data,
        )
        store._state = self._state
        return store

    def _is_key_fresh(self, entry_key: _CacheEntryKey) -> bool:
        """Check if a cached entry is still fresh based on max_age_seconds.

        Uses monotonic time for accurate elapsed time measurement.
        An entry with no recorded insert time (default 0) is treated as
        maximally old, so it fails the freshness check for finite ages.
        """
        if self.max_age_seconds == "infinity":
            return True
        now = time.monotonic()
        elapsed = now - self._state.key_insert_times.get(entry_key, 0)
        return elapsed < self.max_age_seconds

    async def _accommodate_value(self, value_size: int) -> None:
        """Ensure there is enough space in the cache for a new value.

        Must be called while holding self._state.lock.
        """
        if self.max_size is None:
            return

        # Remove least recently used items until we have enough space
        while self._state.current_size + value_size > self.max_size and self._state.cache_order:
            # Get the least recently used key (first in OrderedDict)
            lru_key = next(iter(self._state.cache_order))
            await self._evict_key(lru_key)

    async def _evict_key(self, entry_key: _CacheEntryKey) -> None:
        """Evict a cache entry.

        Must be called while holding self._state.lock.

        For ``str`` keys the entry is deleted from the Store-backed cache.
        For ``(str, ByteRequest)`` keys the entry is removed from the
        in-memory range cache.
        """
        key_size = self._state.key_sizes.get(entry_key, 0)

        if isinstance(entry_key, str):
            await self._cache.delete(entry_key)
        else:
            base_key, byte_range = entry_key
            per_key = self._state.range_cache.get(base_key)
            if per_key is not None:
                per_key.pop(byte_range, None)
                if not per_key:
                    # Drop the now-empty per-key dict to avoid leaking keys
                    del self._state.range_cache[base_key]

        self._state.cache_order.pop(entry_key, None)
        self._state.key_insert_times.pop(entry_key, None)
        self._state.key_sizes.pop(entry_key, None)
        # Clamp at zero so bookkeeping drift can never go negative
        self._state.current_size = max(0, self._state.current_size - key_size)
        self._state.evictions += 1

    async def _track_entry(self, entry_key: _CacheEntryKey, value: Buffer) -> bool:
        """Register *entry_key* in the shared size / LRU tracking.

        Returns ``True`` if the entry was tracked, ``False`` if the value
        exceeds ``max_size`` and was skipped.  Callers should roll back any
        data they already stored when this returns ``False``.

        This method holds the lock for the entire operation to ensure atomicity.
        """
        value_size = len(value)

        # Check if value exceeds max size
        if self.max_size is not None and value_size > self.max_size:
            return False

        async with self._state.lock:
            # If key already exists, subtract old size first
            if entry_key in self._state.key_sizes:
                old_size = self._state.key_sizes[entry_key]
                self._state.current_size -= old_size

            # Make room for the new value
            await self._accommodate_value(value_size)

            # Update tracking atomically
            self._state.cache_order[entry_key] = None
            self._state.current_size += value_size
            self._state.key_sizes[entry_key] = value_size
            self._state.key_insert_times[entry_key] = time.monotonic()

        return True

    async def _update_access_order(self, entry_key: _CacheEntryKey) -> None:
        """Update the access order for LRU tracking.

        The membership check must happen *inside* the lock: acquiring the
        lock is an await point, so checking before it could race with a
        concurrent eviction and make ``move_to_end`` raise ``KeyError``.
        """
        async with self._state.lock:
            if entry_key in self._state.cache_order:
                self._state.cache_order.move_to_end(entry_key)

    def _remove_from_tracking(self, entry_key: _CacheEntryKey) -> None:
        """Remove an entry from all tracking structures.

        Must be called while holding self._state.lock.

        Note: does not adjust ``current_size``; callers that need size
        accounting should use ``_evict_key`` instead.
        """
        self._state.cache_order.pop(entry_key, None)
        self._state.key_insert_times.pop(entry_key, None)
        self._state.key_sizes.pop(entry_key, None)

    def _invalidate_range_entries(self, key: str) -> None:
        """Remove all byte-range entries for *key* from the range cache and tracking.

        Must be called while holding self._state.lock.
        """
        per_key = self._state.range_cache.pop(key, None)
        if per_key is not None:
            for byte_range in per_key:
                entry_key: _CacheEntryKey = (key, byte_range)
                entry_size = self._state.key_sizes.pop(entry_key, 0)
                self._state.cache_order.pop(entry_key, None)
                self._state.key_insert_times.pop(entry_key, None)
                self._state.current_size = max(0, self._state.current_size - entry_size)

    # ------------------------------------------------------------------
    # get helpers
    # ------------------------------------------------------------------

    async def _cache_miss(
        self, key: str, byte_range: ByteRequest | None, result: Buffer | None
    ) -> None:
        """Handle a cache miss by storing or cleaning up after a source-store fetch."""
        if result is None:
            # Key absent from the source store — drop any stale cache entries
            # so future reads do not serve deleted data.
            if byte_range is None:
                await self._cache.delete(key)
                async with self._state.lock:
                    self._remove_from_tracking(key)
            else:
                entry_key: _CacheEntryKey = (key, byte_range)
                async with self._state.lock:
                    per_key = self._state.range_cache.get(key)
                    if per_key is not None:
                        per_key.pop(byte_range, None)
                        if not per_key:
                            del self._state.range_cache[key]
                    self._remove_from_tracking(entry_key)
        else:
            if byte_range is None:
                await self._cache.set(key, result)
                await self._track_entry(key, result)
            else:
                entry_key = (key, byte_range)
                # Mutate range_cache under the lock: every other mutation of
                # it is lock-protected, and an unlocked write here could
                # interleave with a concurrent eviction or invalidation.
                async with self._state.lock:
                    self._state.range_cache.setdefault(key, {})[byte_range] = result
                tracked = await self._track_entry(entry_key, result)
                if not tracked:
                    # Value too large for the cache — roll back the insertion
                    async with self._state.lock:
                        per_key = self._state.range_cache.get(key)
                        if per_key is not None:
                            per_key.pop(byte_range, None)
                            if not per_key:
                                del self._state.range_cache[key]

    async def _get_try_cache(
        self, key: str, prototype: BufferPrototype, byte_range: ByteRequest | None = None
    ) -> Buffer | None:
        """Try to get data from cache first, falling back to source store."""
        if byte_range is None:
            # Full-key read — use Store-backed cache
            maybe_cached = await self._cache.get(key, prototype)
            if maybe_cached is not None:
                self._state.hits += 1
                await self._update_access_order(key)
                return maybe_cached
        else:
            # Byte-range read — use in-memory range cache
            entry_key: _CacheEntryKey = (key, byte_range)
            per_key = self._state.range_cache.get(key)
            if per_key is not None:
                cached_buf = per_key.get(byte_range)
                if cached_buf is not None:
                    self._state.hits += 1
                    await self._update_access_order(entry_key)
                    return cached_buf

        # Cache miss — fetch from source store
        self._state.misses += 1
        result = await super().get(key, prototype, byte_range)
        await self._cache_miss(key, byte_range, result)
        return result

    async def _get_no_cache(
        self, key: str, prototype: BufferPrototype, byte_range: ByteRequest | None = None
    ) -> Buffer | None:
        """Get data directly from source store and update cache.

        Used for stale entries: counts as a miss and refreshes the cache
        with whatever the source store currently holds.
        """
        self._state.misses += 1
        result = await super().get(key, prototype, byte_range)
        await self._cache_miss(key, byte_range, result)
        return result

    async def get(
        self,
        key: str,
        prototype: BufferPrototype,
        byte_range: ByteRequest | None = None,
    ) -> Buffer | None:
        """
        Retrieve data from the store, using cache when appropriate.

        Parameters
        ----------
        key : str
            The key to retrieve
        prototype : BufferPrototype
            Buffer prototype for creating the result buffer
        byte_range : ByteRequest, optional
            Byte range to retrieve

        Returns
        -------
        Buffer | None
            The retrieved data, or None if not found
        """
        entry_key: _CacheEntryKey = (key, byte_range) if byte_range is not None else key
        if not self._is_key_fresh(entry_key):
            # Stale entry: bypass the cache and refresh it from the source
            return await self._get_no_cache(key, prototype, byte_range)
        else:
            return await self._get_try_cache(key, prototype, byte_range)

    async def set(self, key: str, value: Buffer) -> None:
        """
        Store data in the underlying store and optionally in cache.

        Parameters
        ----------
        key : str
            The key to store under
        value : Buffer
            The data to store
        """
        await super().set(key, value)
        # Invalidate all cached byte-range entries (source data changed)
        async with self._state.lock:
            self._invalidate_range_entries(key)
        if self.cache_set_data:
            # Write-through: keep the cache in sync with the new value
            await self._cache.set(key, value)
            await self._track_entry(key, value)
        else:
            # Write-invalidate: drop any cached copy of the old value
            await self._cache.delete(key)
            async with self._state.lock:
                self._remove_from_tracking(key)

    async def delete(self, key: str) -> None:
        """
        Delete data from both the underlying store and cache.

        Parameters
        ----------
        key : str
            The key to delete
        """
        await super().delete(key)
        # Invalidate all cached byte-range entries
        async with self._state.lock:
            self._invalidate_range_entries(key)
        await self._cache.delete(key)
        async with self._state.lock:
            self._remove_from_tracking(key)

    def cache_info(self) -> dict[str, Any]:
        """Return information about the cache state."""
        return {
            "cache_store_type": type(self._cache).__name__,
            # Either an int lifetime in seconds or the literal "infinity"
            "max_age_seconds": self.max_age_seconds,
            "max_size": self.max_size,
            "current_size": self._state.current_size,
            "cache_set_data": self.cache_set_data,
            "tracked_keys": len(self._state.key_insert_times),
            "cached_keys": len(self._state.cache_order),
        }

    def cache_stats(self) -> dict[str, Any]:
        """Return cache performance statistics."""
        total_requests = self._state.hits + self._state.misses
        hit_rate = self._state.hits / total_requests if total_requests > 0 else 0.0
        return {
            "hits": self._state.hits,
            "misses": self._state.misses,
            "evictions": self._state.evictions,
            "total_requests": total_requests,
            "hit_rate": hit_rate,
        }

    async def clear_cache(self) -> None:
        """Clear all cached data and tracking information.

        Hit/miss/eviction statistics are intentionally preserved.
        """
        # Clear the cache store if it supports clear
        if hasattr(self._cache, "clear"):
            await self._cache.clear()

        # Reset tracking
        async with self._state.lock:
            self._state.key_insert_times.clear()
            self._state.cache_order.clear()
            self._state.key_sizes.clear()
            self._state.range_cache.clear()
            self._state.current_size = 0

    def __repr__(self) -> str:
        """Return string representation of the cache store."""
        return (
            f"{self.__class__.__name__}("
            f"store={self._store!r}, "
            f"cache_store={self._cache!r}, "
            f"max_age_seconds={self.max_age_seconds}, "
            f"max_size={self.max_size}, "
            f"current_size={self._state.current_size}, "
            f"cached_keys={len(self._state.cache_order)})"
        )

cache_set_data instance-attribute

cache_set_data: bool = cache_set_data

max_age_seconds instance-attribute

max_age_seconds: int | Literal['infinity']

max_size instance-attribute

max_size: int | None = max_size

read_only property

read_only: bool

Is the store read-only?

supports_consolidated_metadata property

supports_consolidated_metadata: bool

Does the store support consolidated metadata?

If it doesn't an error will be raised on requests to consolidate the metadata. Returning False can be useful for stores which implement their own consolidation mechanism outside of the zarr-python implementation.

supports_deletes property

supports_deletes: bool

Does the store support deletes?

supports_listing property

supports_listing: bool

Does the store support listing?

supports_partial_writes property

supports_partial_writes: Literal[False]

Does the store support partial writes?

Partial writes are no longer used by Zarr, so this is always false.

supports_writes property

supports_writes: bool

Does the store support writes?

__enter__

__enter__() -> Self

Enter a context manager that will close the store upon exiting.

Source code in zarr/storage/_wrapper.py
def __enter__(self) -> Self:
    return self._with_store(self._store.__enter__())

__eq__

__eq__(value: object) -> bool

Equality comparison.

Source code in zarr/storage/_wrapper.py
def __eq__(self, value: object) -> bool:
    return type(self) is type(value) and self._store.__eq__(value._store)  # type: ignore[attr-defined]

__exit__

__exit__(
    exc_type: type[BaseException] | None,
    exc_value: BaseException | None,
    traceback: TracebackType | None,
) -> None

Close the store.

Source code in zarr/storage/_wrapper.py
def __exit__(
    self,
    exc_type: type[BaseException] | None,
    exc_value: BaseException | None,
    traceback: TracebackType | None,
) -> None:
    return self._store.__exit__(exc_type, exc_value, traceback)

__init__

__init__(
    store: Store,
    *,
    cache_store: Store,
    max_age_seconds: int | str = "infinity",
    max_size: int | None = None,
    cache_set_data: bool = True,
) -> None
Source code in zarr/experimental/cache_store.py
def __init__(
    self,
    store: Store,
    *,
    cache_store: Store,
    max_age_seconds: int | str = "infinity",
    max_size: int | None = None,
    cache_set_data: bool = True,
) -> None:
    super().__init__(store)

    if not cache_store.supports_deletes:
        msg = (
            f"The provided cache store {cache_store} does not support deletes. "
            "The cache_store must support deletes for CacheStore to function properly."
        )
        raise ValueError(msg)

    self._cache = cache_store
    # Validate and set max_age_seconds
    if isinstance(max_age_seconds, str):
        if max_age_seconds != "infinity":
            raise ValueError("max_age_seconds string value must be 'infinity'")
        self.max_age_seconds = "infinity"
    else:
        self.max_age_seconds = max_age_seconds
    self.max_size = max_size
    self.cache_set_data = cache_set_data
    self._state = _CacheState()

__repr__

__repr__() -> str

Return string representation of the cache store.

Source code in zarr/experimental/cache_store.py
def __repr__(self) -> str:
    """Return string representation of the cache store."""
    return (
        f"{self.__class__.__name__}("
        f"store={self._store!r}, "
        f"cache_store={self._cache!r}, "
        f"max_age_seconds={self.max_age_seconds}, "
        f"max_size={self.max_size}, "
        f"current_size={self._state.current_size}, "
        f"cached_keys={len(self._state.cache_order)})"
    )

__str__

__str__() -> str
Source code in zarr/storage/_wrapper.py
def __str__(self) -> str:
    return f"wrapping-{self._store}"

cache_info

cache_info() -> dict[str, Any]

Return information about the cache state.

Source code in zarr/experimental/cache_store.py
def cache_info(self) -> dict[str, Any]:
    """Return information about the cache state."""
    return {
        "cache_store_type": type(self._cache).__name__,
        "max_age_seconds": "infinity"
        if self.max_age_seconds == "infinity"
        else self.max_age_seconds,
        "max_size": self.max_size,
        "current_size": self._state.current_size,
        "cache_set_data": self.cache_set_data,
        "tracked_keys": len(self._state.key_insert_times),
        "cached_keys": len(self._state.cache_order),
    }

cache_stats

cache_stats() -> dict[str, Any]

Return cache performance statistics.

Source code in zarr/experimental/cache_store.py
def cache_stats(self) -> dict[str, Any]:
    """Return cache performance statistics."""
    total_requests = self._state.hits + self._state.misses
    hit_rate = self._state.hits / total_requests if total_requests > 0 else 0.0
    return {
        "hits": self._state.hits,
        "misses": self._state.misses,
        "evictions": self._state.evictions,
        "total_requests": total_requests,
        "hit_rate": hit_rate,
    }

clear async

clear() -> None

Clear the store.

Remove all keys and values from the store.

Source code in zarr/storage/_wrapper.py
async def clear(self) -> None:
    return await self._store.clear()

clear_cache async

clear_cache() -> None

Clear all cached data and tracking information.

Source code in zarr/experimental/cache_store.py
async def clear_cache(self) -> None:
    """Clear all cached data and tracking information."""
    # Clear the cache store if it supports clear
    if hasattr(self._cache, "clear"):
        await self._cache.clear()

    # Reset tracking
    async with self._state.lock:
        self._state.key_insert_times.clear()
        self._state.cache_order.clear()
        self._state.key_sizes.clear()
        self._state.range_cache.clear()
        self._state.current_size = 0

close

close() -> None

Close the store.

Source code in zarr/storage/_wrapper.py
def close(self) -> None:
    self._store.close()

delete async

delete(key: str) -> None

Delete data from both the underlying store and cache.

Parameters:

  • key (str) –

    The key to delete

Source code in zarr/experimental/cache_store.py
async def delete(self, key: str) -> None:
    """
    Delete data from both the underlying store and cache.

    Parameters
    ----------
    key : str
        The key to delete
    """
    await super().delete(key)
    # Invalidate all cached byte-range entries
    async with self._state.lock:
        self._invalidate_range_entries(key)
    await self._cache.delete(key)
    async with self._state.lock:
        self._remove_from_tracking(key)

delete_dir async

delete_dir(prefix: str) -> None

Remove all keys and prefixes in the store that begin with a given prefix.

Source code in zarr/storage/_wrapper.py
async def delete_dir(self, prefix: str) -> None:
    return await self._store.delete_dir(prefix)

exists async

exists(key: str) -> bool

Check if a key exists in the store.

Parameters:

  • key (str) –

Returns:

Source code in zarr/storage/_wrapper.py
async def exists(self, key: str) -> bool:
    return await self._store.exists(key)

get async

get(
    key: str,
    prototype: BufferPrototype,
    byte_range: ByteRequest | None = None,
) -> Buffer | None

Retrieve data from the store, using cache when appropriate.

Parameters:

  • key (str) –

    The key to retrieve

  • prototype (BufferPrototype) –

    Buffer prototype for creating the result buffer

  • byte_range (ByteRequest, default: None ) –

    Byte range to retrieve

Returns:

  • Buffer | None

    The retrieved data, or None if not found

Source code in zarr/experimental/cache_store.py
async def get(
    self,
    key: str,
    prototype: BufferPrototype,
    byte_range: ByteRequest | None = None,
) -> Buffer | None:
    """
    Retrieve data from the store, using cache when appropriate.

    Parameters
    ----------
    key : str
        The key to retrieve
    prototype : BufferPrototype
        Buffer prototype for creating the result buffer
    byte_range : ByteRequest, optional
        Byte range to retrieve

    Returns
    -------
    Buffer | None
        The retrieved data, or None if not found
    """
    entry_key: _CacheEntryKey = (key, byte_range) if byte_range is not None else key
    if not self._is_key_fresh(entry_key):
        return await self._get_no_cache(key, prototype, byte_range)
    else:
        return await self._get_try_cache(key, prototype, byte_range)

get_partial_values async

get_partial_values(
    prototype: BufferPrototype,
    key_ranges: Iterable[tuple[str, ByteRequest | None]],
) -> list[Buffer | None]

Retrieve possibly partial values from given key_ranges.

Parameters:

  • prototype (BufferPrototype) –

    The prototype of the output buffer. Stores may support a default buffer prototype.

  • key_ranges (Iterable[tuple[str, tuple[int | None, int | None]]]) –

    Ordered set of key, range pairs, a key may occur multiple times with different ranges

Returns:

  • list of values, in the order of the key_ranges, may contain null/none for missing keys
Source code in zarr/storage/_wrapper.py
async def get_partial_values(
    self,
    prototype: BufferPrototype,
    key_ranges: Iterable[tuple[str, ByteRequest | None]],
) -> list[Buffer | None]:
    return await self._store.get_partial_values(prototype, key_ranges)

getsize async

getsize(key: str) -> int

Return the size, in bytes, of a value in a Store.

Parameters:

  • key (str) –

Returns:

  • nbytes ( int ) –

    The size of the value (in bytes).

Raises:

Source code in zarr/abc/store.py
async def getsize(self, key: str) -> int:
    """
    Return the size, in bytes, of a value in a Store.

    Parameters
    ----------
    key : str

    Returns
    -------
    nbytes : int
        The size of the value (in bytes).

    Raises
    ------
    FileNotFoundError
        When the given key does not exist in the store.
    """
    # Note to implementers: this default implementation is very inefficient since
    # it requires reading the entire object. Many systems will have ways to get the
    # size of an object without reading it.
    # avoid circular import
    from zarr.core.buffer.core import default_buffer_prototype

    value = await self.get(key, prototype=default_buffer_prototype())
    if value is None:
        raise FileNotFoundError(key)
    return len(value)

getsize_prefix async

getsize_prefix(prefix: str) -> int

Return the size, in bytes, of all values under a prefix.

Parameters:

  • prefix (str) –

    The prefix of the directory to measure.

Returns:

  • nbytes ( int ) –

    The sum of the sizes of the values in the directory (in bytes).

See Also

zarr.Array.nbytes_stored Store.getsize

Notes

getsize_prefix is just provided as a potentially faster alternative to listing all the keys under a prefix calling Store.getsize on each.

In general, prefix should be the path of an Array or Group in the Store. Implementations may differ on the behavior when some other prefix is provided.

Source code in zarr/abc/store.py
async def getsize_prefix(self, prefix: str) -> int:
    """
    Return the size, in bytes, of all values under a prefix.

    Parameters
    ----------
    prefix : str
        The prefix of the directory to measure.

    Returns
    -------
    nbytes : int
        The sum of the sizes of the values in the directory (in bytes).

    See Also
    --------
    zarr.Array.nbytes_stored
    Store.getsize

    Notes
    -----
    ``getsize_prefix`` is just provided as a potentially faster alternative to
    listing all the keys under a prefix calling [`Store.getsize`][zarr.abc.store.Store.getsize] on each.

    In general, ``prefix`` should be the path of an Array or Group in the Store.
    Implementations may differ on the behavior when some other ``prefix``
    is provided.
    """
    # TODO: Overlap listing keys with getsize calls.
    # Currently, we load the list of keys into memory and only then move
    # on to getting sizes. Ideally we would overlap those two, which should
    # improve tail latency and might reduce memory pressure (since not all keys
    # would be in memory at once).

    # avoid circular import
    from zarr.core.common import concurrent_map
    from zarr.core.config import config

    keys = [(x,) async for x in self.list_prefix(prefix)]
    limit = config.get("async.concurrency")
    sizes = await concurrent_map(keys, self.getsize, limit=limit)
    return sum(sizes)

is_empty async

is_empty(prefix: str) -> bool

Check if the directory is empty.

Parameters:

  • prefix (str) –

    Prefix of keys to check.

Returns:

  • bool

    True if the store is empty, False otherwise.

Source code in zarr/storage/_wrapper.py
async def is_empty(self, prefix: str) -> bool:
    """Delegate the emptiness check for ``prefix`` to the wrapped store."""
    inner_result = await self._store.is_empty(prefix)
    return inner_result

list

list() -> AsyncIterator[str]

Retrieve all keys in the store.

Returns:

Source code in zarr/storage/_wrapper.py
def list(self) -> AsyncIterator[str]:
    """Return the wrapped store's iterator over every key it holds."""
    key_iterator = self._store.list()
    return key_iterator

list_dir

list_dir(prefix: str) -> AsyncIterator[str]

Retrieve all keys and prefixes with a given prefix and which do not contain the character “/” after the given prefix.

Parameters:

  • prefix (str) –

Returns:

Source code in zarr/storage/_wrapper.py
def list_dir(self, prefix: str) -> AsyncIterator[str]:
    """Forward a shallow ("directory") listing under ``prefix`` to the inner store."""
    listing = self._store.list_dir(prefix)
    return listing

list_prefix

list_prefix(prefix: str) -> AsyncIterator[str]

Retrieve all keys in the store that begin with a given prefix. Keys are returned relative to the root of the store.

Parameters:

  • prefix (str) –

Returns:

Source code in zarr/storage/_wrapper.py
def list_prefix(self, prefix: str) -> AsyncIterator[str]:
    """Forward a recursive key listing under ``prefix`` to the inner store."""
    matches = self._store.list_prefix(prefix)
    return matches

open async classmethod

open(
    store_cls: type[T_Store], *args: Any, **kwargs: Any
) -> Self

Create and open the store.

Parameters:

  • *args (Any, default: () ) –

    Positional arguments to pass to the store constructor.

  • **kwargs (Any, default: {} ) –

    Keyword arguments to pass to the store constructor.

Returns:

  • Store

    The opened store instance.

Source code in zarr/storage/_wrapper.py
@classmethod
async def open(cls: type[Self], store_cls: type[T_Store], *args: Any, **kwargs: Any) -> Self:
    """
    Construct ``store_cls`` from the given arguments, open it, and wrap it.

    Parameters
    ----------
    store_cls
        The concrete store class to instantiate and open.
    *args, **kwargs
        Forwarded verbatim to the ``store_cls`` constructor.

    Returns
    -------
    An opened wrapper around the freshly created inner store.
    """
    inner = store_cls(*args, **kwargs)
    await inner._open()
    return cls(store=inner)

set async

set(key: str, value: Buffer) -> None

Store data in the underlying store and optionally in cache.

Parameters:

  • key (str) –

    The key to store under

  • value (Buffer) –

    The data to store

Source code in zarr/experimental/cache_store.py
async def set(self, key: str, value: Buffer) -> None:
    """
    Store data in the underlying store and optionally in cache.

    Parameters
    ----------
    key : str
        The key to store under
    value : Buffer
        The data to store
    """
    await super().set(key, value)
    # The source value just changed, so any byte-range entries cached for
    # this key are stale and must be dropped under the shared lock.
    async with self._state.lock:
        self._invalidate_range_entries(key)
    if not self.cache_set_data:
        # Write-caching is disabled: make sure neither a stale full-key
        # copy nor its tracking metadata survives.
        await self._cache.delete(key)
        async with self._state.lock:
            self._remove_from_tracking(key)
        return
    await self._cache.set(key, value)
    await self._track_entry(key, value)

set_if_not_exists async

set_if_not_exists(key: str, value: Buffer) -> None

Store a key to value if the key is not already present.

Parameters:

Source code in zarr/storage/_wrapper.py
async def set_if_not_exists(self, key: str, value: Buffer) -> None:
    """Write ``value`` under ``key`` only when the inner store lacks that key."""
    outcome = await self._store.set_if_not_exists(key, value)
    return outcome

with_read_only

with_read_only(read_only: bool = False) -> Self

Return a new store with a new read_only setting.

The new store points to the same location with the specified new read_only state. The returned Store is not automatically opened, and this store is not automatically closed.

Parameters:

  • read_only (bool, default: False ) –

    If True, the store will be created in read-only mode. Defaults to False.

Returns:

  • A new store of the same type with the new read-only attribute.
Source code in zarr/experimental/cache_store.py
def with_read_only(self, read_only: bool = False) -> Self:
    """
    Return a copy of this cache store whose inner store has the requested
    read-only setting.

    The clone points at the same cache backend and shares the mutable
    tracking state, so cached entries and eviction bookkeeping stay
    coherent across both instances.

    Parameters
    ----------
    read_only : bool, default False
        Whether the new inner store should be read-only.

    Returns
    -------
    A new store of the same type with the new read-only attribute.
    """
    clone = type(self)(
        store=self._store.with_read_only(read_only),
        cache_store=self._cache,
        max_age_seconds=self.max_age_seconds,
        max_size=self.max_size,
        cache_set_data=self.cache_set_data,
    )
    # Share (rather than copy) the mutable state object so both instances
    # observe the same cached entries and LRU metadata.
    clone._state = self._state
    return clone