From 22341c8b06dfa0c53e68847ed25b9898b4aa1890 Mon Sep 17 00:00:00 2001 From: sneakers-the-rat Date: Fri, 13 Dec 2024 17:53:20 -0800 Subject: [PATCH 1/5] correctly failing tests for np.str_ in a tuple --- src/numpydantic/testing/cases.py | 21 +++++++++++++++++++++ src/numpydantic/testing/interfaces.py | 4 +++- 2 files changed, 24 insertions(+), 1 deletion(-) diff --git a/src/numpydantic/testing/cases.py b/src/numpydantic/testing/cases.py index 042317d..4f715fd 100644 --- a/src/numpydantic/testing/cases.py +++ b/src/numpydantic/testing/cases.py @@ -126,6 +126,27 @@ DTYPE_CASES = [ ValidationCase(annotation_dtype=str, dtype=str, passes=True, id="str-str"), ValidationCase(annotation_dtype=str, dtype=int, passes=False, id="str-int"), ValidationCase(annotation_dtype=str, dtype=float, passes=False, id="str-float"), + ValidationCase( + annotation_dtype=np.str_, + dtype=str, + passes=True, + id="np_str-str", + marks={"np_str", "str"}, + ), + ValidationCase( + annotation_dtype=np.str_, + dtype=np.str_, + passes=True, + id="np_str-np_str", + marks={"np_str", "str"}, + ), + ValidationCase( + annotation_dtype=(int, np.str_), + dtype=str, + passes=True, + id="tuple_np_str-str", + marks={"np_str", "str", "tuple"}, + ), ValidationCase( annotation_dtype=BasicModel, dtype=BasicModel, passes=True, id="model-model" ), diff --git a/src/numpydantic/testing/interfaces.py b/src/numpydantic/testing/interfaces.py index a11bc6a..c247169 100644 --- a/src/numpydantic/testing/interfaces.py +++ b/src/numpydantic/testing/interfaces.py @@ -75,6 +75,8 @@ class HDF5Case(_HDF5MetaCase): data = np.array(array, dtype=dtype) elif dtype is str: data = generator.random(shape).astype(bytes) + elif dtype is np.str_: + data = generator.random(shape).astype("S32") elif dtype is datetime: data = np.empty(shape, dtype="S32") data.fill(datetime.now(timezone.utc).isoformat().encode("utf-8")) @@ -106,7 +108,7 @@ class HDF5CompoundCase(_HDF5MetaCase): array_path = "/" + "_".join([str(s) for s in shape]) + "__" + dtype.__name__ if array is not None: data = np.array(array, dtype=dtype) - elif dtype is str: + elif dtype in (str, np.str_): dt = np.dtype([("data", np.dtype("S10")), ("extra", "i8")]) data = np.array([("hey", 0)] * np.prod(shape), dtype=dt).reshape(shape) elif dtype is datetime: From e942da4becaba1c3c548ea864712cfce567506b9 Mon Sep 17 00:00:00 2001 From: sneakers-the-rat Date: Fri, 13 Dec 2024 17:55:35 -0800 Subject: [PATCH 2/5] recursively validate tuples instead of simple containment checking --- src/numpydantic/validation/dtype.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/numpydantic/validation/dtype.py b/src/numpydantic/validation/dtype.py index 5eeb124..d9b2790 100644 --- a/src/numpydantic/validation/dtype.py +++ b/src/numpydantic/validation/dtype.py @@ -32,7 +32,7 @@ def validate_dtype(dtype: Any, target: DtypeType) -> bool: return True if isinstance(target, tuple): - valid = dtype in target + valid = any(validate_dtype(dtype, target_dt) for target_dt in target) elif is_union(target): valid = any( [validate_dtype(dtype, target_dt) for target_dt in get_args(target)] From 616785e6ed4f8f7921a11cf2b0b624550f84b296 Mon Sep 17 00:00:00 2001 From: sneakers-the-rat Date: Fri, 13 Dec 2024 18:08:16 -0800 Subject: [PATCH 3/5] zarr roundtripping strings to/from json --- src/numpydantic/interface/zarr.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/src/numpydantic/interface/zarr.py b/src/numpydantic/interface/zarr.py index 2e3d993..2a1e9c3 100644 --- a/src/numpydantic/interface/zarr.py +++ b/src/numpydantic/interface/zarr.py @@ -74,7 +74,8 @@ class ZarrJsonDict(JsonDict): if self.file: array = ZarrArrayPath(file=self.file, path=self.path) else: - array = zarr.array(self.value, dtype=self.dtype) + dtype = np.str_ if self.dtype == "str" else self.dtype + array = zarr.array(self.value, dtype=dtype) return array From 4fe3a72db55cbc160004666ba95de74bf01a7bbf Mon Sep 17 00:00:00 2001 From: sneakers-the-rat Date: Fri, 13 Dec 2024 18:12:00 -0800 Subject: [PATCH 4/5] changelog --- docs/changelog.md | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/docs/changelog.md b/docs/changelog.md index e2ddc40..5253d60 100644 --- a/docs/changelog.md +++ b/docs/changelog.md @@ -8,6 +8,11 @@ An additional check was added for presence of `__name__` when embedding. - `NDArray` types were incorrectly cached s.t. pipe-union dtypes were considered equivalent to `Union[]` dtypes. An additional tuple with the type of the args was added to the cache key to disambiguate them. +- [#38](https://github.com/p2p-ld/numpydantic/issues/38), [#40](https://github.com/p2p-ld/numpydantic/pull/40) - + - Tuple dtypes were naively checked by just testing for whether the given dtype was contained by the tuple, + ignoring special cases like string type checking. Tuple dtypes are now checked recursively with the same + logic as all other type checking. + - Zarr treats `dtype=str` as numpy type `O` - added special case when validating from JSON to cast to `np.str_` **Testing** - [#39](https://github.com/p2p-ld/numpydantic/pull/39) - Test that all combinations of shapes, dtypes, and interfaces @@ -15,6 +20,8 @@ - [#39](https://github.com/p2p-ld/numpydantic/pull/39) - Add python 3.13 to the testing matrix. - [#39](https://github.com/p2p-ld/numpydantic/pull/39) - Add an additional `marks` field to ValidationCase for finer-grained control over running tests. +- [#40](https://github.com/p2p-ld/numpydantic/pull/40) - Explicitly test for `np.str_` annotation dtypes alone and + in tuples. ## 1.* From f90df3032479c65c477d6da6932e7ecd4b876891 Mon Sep 17 00:00:00 2001 From: sneakers-the-rat Date: Fri, 13 Dec 2024 18:14:24 -0800 Subject: [PATCH 5/5] bump version, move changelog into place --- docs/changelog.md | 10 +++++----- pyproject.toml | 2 +- 2 files changed, 6 insertions(+), 6 deletions(-) diff --git a/docs/changelog.md b/docs/changelog.md index 5253d60..0e0dcc2 100644 --- a/docs/changelog.md +++ b/docs/changelog.md @@ -1,6 +1,10 @@ # Changelog -## Upcoming +## 1.* + +### 1.6.* + +#### 1.6.6 - 24-12-13 **Bugfix** - [#38](https://github.com/p2p-ld/numpydantic/issues/38), [#39](https://github.com/p2p-ld/numpydantic/pull/39) - @@ -23,10 +27,6 @@ - [#40](https://github.com/p2p-ld/numpydantic/pull/40) - Explicitly test for `np.str_` annotation dtypes alone and in tuples. -## 1.* - -### 1.6.* - #### 1.6.5 - 24-12-04 - Bump Pydantic Minimum **Bugfix** diff --git a/pyproject.toml b/pyproject.toml index 36c7220..dc585d4 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -1,6 +1,6 @@ [project] name = "numpydantic" -version = "1.6.5" +version = "1.6.6" description = "Type and shape validation and serialization for arbitrary array types in pydantic models" authors = [ {name = "sneakers-the-rat", email = "sneakers-the-rat@protonmail.com"},