Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 0 additions & 1 deletion pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -241,7 +241,6 @@ module = [
"zarr.array",
"zarr.common",
"zarr.group",
"zarr.metadata"
]
disallow_untyped_defs = false

Expand Down
2 changes: 2 additions & 0 deletions src/zarr/array.py
Original file line number Diff line number Diff line change
Expand Up @@ -199,6 +199,8 @@ async def _create_v3(

if chunk_key_encoding is None:
chunk_key_encoding = ("default", "/")
assert chunk_key_encoding is not None

if isinstance(chunk_key_encoding, tuple):
chunk_key_encoding = (
V2ChunkKeyEncoding(separator=chunk_key_encoding[1])
Expand Down
8 changes: 4 additions & 4 deletions src/zarr/chunk_grids.py
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,7 @@
import itertools
from collections.abc import Iterator
from dataclasses import dataclass
from typing import TYPE_CHECKING, Any
from typing import TYPE_CHECKING

from zarr.abc.metadata import Metadata
from zarr.common import (
Expand All @@ -22,13 +22,13 @@
@dataclass(frozen=True)
class ChunkGrid(Metadata):
@classmethod
def from_dict(cls, data: dict[str, JSON]) -> ChunkGrid:
def from_dict(cls, data: dict[str, JSON] | ChunkGrid) -> ChunkGrid:
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

your change is fine but I don't know why from_dict accepts a ChunkGrid object. 🤷

if isinstance(data, ChunkGrid):
return data

name_parsed, _ = parse_named_configuration(data)
if name_parsed == "regular":
return RegularChunkGrid.from_dict(data)
return RegularChunkGrid._from_dict(data)
raise ValueError(f"Unknown chunk grid. Got {name_parsed}.")

def all_chunk_coords(self, array_shape: ChunkCoords) -> Iterator[ChunkCoords]:
Expand All @@ -45,7 +45,7 @@ def __init__(self, *, chunk_shape: ChunkCoordsLike) -> None:
object.__setattr__(self, "chunk_shape", chunk_shape_parsed)

@classmethod
def from_dict(cls, data: dict[str, Any]) -> Self:
def _from_dict(cls, data: dict[str, JSON]) -> Self:
_, configuration_parsed = parse_named_configuration(data, "regular")

return cls(**configuration_parsed) # type: ignore[arg-type]
Expand Down
2 changes: 1 addition & 1 deletion src/zarr/chunk_key_encodings.py
Original file line number Diff line number Diff line change
Expand Up @@ -34,7 +34,7 @@ def __init__(self, *, separator: SeparatorLiteral) -> None:
object.__setattr__(self, "separator", separator_parsed)

@classmethod
def from_dict(cls, data: dict[str, JSON]) -> ChunkKeyEncoding:
def from_dict(cls, data: dict[str, JSON] | ChunkKeyEncoding) -> ChunkKeyEncoding:
if isinstance(data, ChunkKeyEncoding):
return data

Expand Down
5 changes: 3 additions & 2 deletions src/zarr/common.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,6 +13,7 @@
from collections.abc import Awaitable, Callable, Iterator

import numpy as np
import numpy.typing as npt

ZARR_JSON = "zarr.json"
ZARRAY_JSON = ".zarray"
Expand Down Expand Up @@ -150,7 +151,7 @@ def parse_named_configuration(
return name_parsed, configuration_parsed


def parse_shapelike(data: Any) -> tuple[int, ...]:
def parse_shapelike(data: Iterable[int]) -> tuple[int, ...]:
if not isinstance(data, Iterable):
raise TypeError(f"Expected an iterable. Got {data} instead.")
data_tuple = tuple(data)
Expand All @@ -164,7 +165,7 @@ def parse_shapelike(data: Any) -> tuple[int, ...]:
return data_tuple


def parse_dtype(data: Any) -> np.dtype[Any]:
def parse_dtype(data: npt.DTypeLike) -> np.dtype[Any]:
# todo: real validation
return np.dtype(data)

Expand Down
41 changes: 22 additions & 19 deletions src/zarr/metadata.py
Original file line number Diff line number Diff line change
Expand Up @@ -22,6 +22,7 @@

from typing_extensions import Self

import numcodecs.abc

from zarr.common import (
JSON,
Expand Down Expand Up @@ -168,15 +169,15 @@ class ArrayV3Metadata(ArrayMetadata):
def __init__(
self,
*,
shape,
data_type,
chunk_grid,
chunk_key_encoding,
fill_value,
codecs,
attributes,
dimension_names,
):
shape: Iterable[int],
data_type: npt.DTypeLike,
chunk_grid: dict[str, JSON] | ChunkGrid,
chunk_key_encoding: dict[str, JSON] | ChunkKeyEncoding,
fill_value: Any,
codecs: Iterable[Codec | JSON],
attributes: None | dict[str, JSON],
dimension_names: None | Iterable[str],
) -> None:
"""
Because the class is a frozen dataclass, we set attributes using object.__setattr__
"""
Expand Down Expand Up @@ -249,14 +250,14 @@ def encode_chunk_key(self, chunk_coords: ChunkCoords) -> str:
return self.chunk_key_encoding.encode_chunk_key(chunk_coords)

def to_buffer_dict(self) -> dict[str, Buffer]:
def _json_convert(o):
def _json_convert(o: np.dtype[Any] | Enum | Codec) -> str | dict[str, Any]:
if isinstance(o, np.dtype):
return str(o)
if isinstance(o, Enum):
return o.name
# this serializes numcodecs compressors
# todo: implement to_dict for codecs
elif hasattr(o, "get_config"):
elif isinstance(o, numcodecs.abc.Codec):
return o.get_config()
raise TypeError

Expand All @@ -271,9 +272,10 @@ def from_dict(cls, data: dict[str, JSON]) -> ArrayV3Metadata:
# check that the node_type attribute is correct
_ = parse_node_type_array(data.pop("node_type"))

dimension_names = data.pop("dimension_names", None)
data["dimension_names"] = data.pop("dimension_names", None)

return cls(**data, dimension_names=dimension_names)
# TODO: Remove the ignores and use a TypedDict to type `data`
return cls(**data) # type: ignore[arg-type]

def to_dict(self) -> dict[str, Any]:
out_dict = super().to_dict()
Expand Down Expand Up @@ -367,7 +369,9 @@ def codec_pipeline(self) -> CodecPipeline:
)

def to_buffer_dict(self) -> dict[str, Buffer]:
def _json_convert(o):
def _json_convert(
o: np.dtype[Any],
) -> str | list[tuple[str, str] | tuple[str, str, tuple[int, ...]]]:
if isinstance(o, np.dtype):
if o.fields is None:
return o.str
Expand Down Expand Up @@ -399,7 +403,7 @@ def to_dict(self) -> JSON:
zarray_dict["chunks"] = self.chunk_grid.chunk_shape

_ = zarray_dict.pop("data_type")
zarray_dict["dtype"] = self.data_type
zarray_dict["dtype"] = self.data_type.str

return zarray_dict

Expand All @@ -422,7 +426,7 @@ def update_attributes(self, attributes: dict[str, JSON]) -> Self:
return replace(self, attributes=attributes)


def parse_dimension_names(data: Any) -> tuple[str, ...] | None:
def parse_dimension_names(data: None | Iterable[str]) -> tuple[str, ...] | None:
if data is None:
return data
if isinstance(data, Iterable) and all([isinstance(x, str) for x in data]):
Expand All @@ -432,12 +436,11 @@ def parse_dimension_names(data: Any) -> tuple[str, ...] | None:


# todo: real validation
def parse_attributes(data: Any) -> dict[str, JSON]:
def parse_attributes(data: None | dict[str, JSON]) -> dict[str, JSON]:
if data is None:
return {}

data_json = cast(dict[str, JSON], data)
return data_json
return data


# todo: move to its own module and drop _v3 suffix
Expand Down