bump spec #460

Open · wants to merge 12 commits into main
2 changes: 1 addition & 1 deletion .github/workflows/build.yaml
@@ -174,7 +174,7 @@ jobs:
           path: bioimageio_cache
           key: ${{matrix.run-expensive-tests && needs.populate-cache.outputs.cache-key || needs.populate-cache.outputs.cache-key-light}}
       - name: pytest
-        run: pytest --disable-pytest-warnings
+        run: pytest --cov bioimageio --cov-report xml --cov-append --capture no --disable-pytest-warnings
         env:
           BIOIMAGEIO_CACHE_PATH: bioimageio_cache
           RUN_EXPENSIVE_TESTS: ${{ matrix.run-expensive-tests && 'true' || 'false' }}
2 changes: 2 additions & 0 deletions bioimageio/core/__init__.py
@@ -3,6 +3,7 @@
 """

 from bioimageio.spec import (
+    ValidationSummary,
     build_description,
     dump_description,
     load_dataset_description,
@@ -112,4 +113,5 @@
     "test_model",
     "test_resource",
     "validate_format",
+    "ValidationSummary",
 ]
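
With this re-export, ValidationSummary can be imported from bioimageio.core directly instead of from bioimageio.spec. A minimal usage sketch (the model ID is a placeholder, and summary fields beyond status are illustrative):

    from bioimageio.core import ValidationSummary, test_model

    summary: ValidationSummary = test_model("affable-shark")  # placeholder model ID
    print(summary.status)  # overall test result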
5 changes: 3 additions & 2 deletions bioimageio/core/backends/keras_backend.py
@@ -4,17 +4,18 @@
 from loguru import logger
 from numpy.typing import NDArray

-from bioimageio.spec._internal.type_guards import is_list, is_tuple
+from bioimageio.spec._internal.io import download
 from bioimageio.spec.model import v0_4, v0_5
 from bioimageio.spec.model.v0_5 import Version
-from bioimageio.spec.utils import download

 from .._settings import settings
 from ..digest_spec import get_axes_infos
+from ..utils._type_guards import is_list, is_tuple
 from ._model_adapter import ModelAdapter

 os.environ["KERAS_BACKEND"] = settings.keras_backend
+

 # by default, we use the keras integrated with tensorflow
 # TODO: check if we should prefer keras
 try:
2 changes: 1 addition & 1 deletion bioimageio/core/backends/onnx_backend.py
@@ -5,11 +5,11 @@
 import onnxruntime as rt  # pyright: ignore[reportMissingTypeStubs]
 from numpy.typing import NDArray

-from bioimageio.spec._internal.type_guards import is_list, is_tuple
 from bioimageio.spec.model import v0_4, v0_5
 from bioimageio.spec.utils import download

 from ..model_adapters import ModelAdapter
+from ..utils._type_guards import is_list, is_tuple


 class ONNXModelAdapter(ModelAdapter):
8 changes: 6 additions & 2 deletions bioimageio/core/backends/pytorch_backend.py
@@ -11,12 +11,13 @@
 from torch import nn
 from typing_extensions import assert_never

-from bioimageio.spec._internal.type_guards import is_list, is_ndarray, is_tuple
+from bioimageio.spec._internal.version_type import Version
 from bioimageio.spec.common import ZipPath
 from bioimageio.spec.model import AnyModelDescr, v0_4, v0_5
 from bioimageio.spec.utils import download

 from ..digest_spec import import_callable
+from ..utils._type_guards import is_list, is_ndarray, is_tuple
 from ._model_adapter import ModelAdapter

@@ -143,7 +144,10 @@ def load_torch_state_dict(
     model = model.to(devices[0])
     with path.open("rb") as f:
         assert not isinstance(f, TextIOWrapper)
-        state = torch.load(f, map_location=devices[0], weights_only=True)
+        if Version(str(torch.__version__)) < Version("1.13"):
+            state = torch.load(f, map_location=devices[0])
+        else:
+            state = torch.load(f, map_location=devices[0], weights_only=True)

     incompatible = model.load_state_dict(state)
     if (
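
torch.load only accepts the weights_only argument from torch 1.13 on, so the version guard above keeps older installations working while opting into safer, tensors-only unpickling where available. A standalone sketch of the same pattern, using packaging.version.Version as a stand-in for the Version type imported from bioimageio.spec:

    import torch
    from packaging.version import Version  # stand-in for bioimageio.spec's Version

    def load_state_dict_compat(path: str, device: str = "cpu"):
        if Version(str(torch.__version__)) < Version("1.13"):
            # weights_only does not exist yet; falls back to full unpickling
            return torch.load(path, map_location=device)
        # restrict unpickling to tensors and plain containers
        return torch.load(path, map_location=device, weights_only=True)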
2 changes: 1 addition & 1 deletion bioimageio/core/backends/torchscript_backend.py
@@ -6,11 +6,11 @@
 import torch
 from numpy.typing import NDArray

-from bioimageio.spec._internal.type_guards import is_list, is_tuple
 from bioimageio.spec.model import v0_4, v0_5
 from bioimageio.spec.utils import download

 from ..model_adapters import ModelAdapter
+from ..utils._type_guards import is_list, is_tuple


 class TorchscriptModelAdapter(ModelAdapter):
132 changes: 78 additions & 54 deletions bioimageio/core/io.py
@@ -1,7 +1,6 @@
 import collections.abc
 import warnings
 import zipfile
-from io import TextIOWrapper
 from pathlib import Path, PurePosixPath
 from shutil import copyfileobj
 from typing import (
@@ -15,15 +14,16 @@
 )

 import h5py  # pyright: ignore[reportMissingTypeStubs]
-import numpy as np
 from imageio.v3 import imread, imwrite  # type: ignore
 from loguru import logger
 from numpy.typing import NDArray
 from pydantic import BaseModel, ConfigDict, TypeAdapter
 from typing_extensions import assert_never

-from bioimageio.spec._internal.io import interprete_file_source
+from bioimageio.spec._internal.io import get_reader, interprete_file_source
+from bioimageio.spec._internal.type_guards import is_ndarray
 from bioimageio.spec.common import (
+    FileSource,
     HttpUrl,
     PermissiveFileSource,
     RelativeFilePath,
@@ -65,51 +65,51 @@ def load_image(
     else:
         src = parsed_source

-    # FIXME: why is pyright complaining about giving the union to _split_dataset_path?
     if isinstance(src, Path):
-        file_source, subpath = _split_dataset_path(src)
+        file_source, suffix, subpath = _split_dataset_path(src)
     elif isinstance(src, HttpUrl):
-        file_source, subpath = _split_dataset_path(src)
+        file_source, suffix, subpath = _split_dataset_path(src)
     elif isinstance(src, ZipPath):
-        file_source, subpath = _split_dataset_path(src)
+        file_source, suffix, subpath = _split_dataset_path(src)
     else:
         assert_never(src)

-    path = download(file_source).path
-
-    if path.suffix == ".npy":
+    if suffix == ".npy":
         if subpath is not None:
-            raise ValueError(f"Unexpected subpath {subpath} for .npy path {path}")
-        return load_array(path)
-    elif path.suffix in SUFFIXES_WITH_DATAPATH:
+            logger.warning(
+                "Unexpected subpath {} for .npy source {}", subpath, file_source
+            )
+
+        image = load_array(file_source)
+    elif suffix in SUFFIXES_WITH_DATAPATH:
         if subpath is None:
             dataset_path = DEFAULT_H5_DATASET_PATH
         else:
             dataset_path = str(subpath)

-        with h5py.File(path, "r") as f:
+        reader = download(file_source)
+
+        with h5py.File(reader, "r") as f:
             h5_dataset = f.get(  # pyright: ignore[reportUnknownVariableType]
                 dataset_path
             )
             if not isinstance(h5_dataset, h5py.Dataset):
                 raise ValueError(
-                    f"{path} is not of type {h5py.Dataset}, but has type "
+                    f"{file_source} did not load as {h5py.Dataset}, but has type "
                     + str(
                         type(h5_dataset)  # pyright: ignore[reportUnknownArgumentType]
                     )
                 )
+            image: NDArray[Any]
             image = h5_dataset[:]  # pyright: ignore[reportUnknownVariableType]
-            assert isinstance(image, np.ndarray), type(
-                image  # pyright: ignore[reportUnknownArgumentType]
-            )
-            return image  # pyright: ignore[reportUnknownVariableType]
-    elif isinstance(path, ZipPath):
-        return imread(
-            path.read_bytes(), extension=path.suffix
-        )  # pyright: ignore[reportUnknownVariableType]
     else:
-        return imread(path)  # pyright: ignore[reportUnknownVariableType]
+        reader = download(file_source)
+        image = imread(  # pyright: ignore[reportUnknownVariableType]
+            reader.read(), extension=suffix
+        )

+    assert is_ndarray(image)
+    return image


 def load_tensor(
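
With the suffix split off up front, load_image dispatches on the file extension even when an internal dataset path is appended after it. A usage sketch (file names are placeholders):

    from bioimageio.core.io import load_image

    a = load_image("volume.npy")              # numpy file, loaded via load_array
    b = load_image("stacks.h5/raw/channel0")  # dataset "raw/channel0" inside stacks.h5
    c = load_image("slice.tif")               # any other suffix goes through imageio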
@@ -123,19 +123,21 @@ def load_tensor(


 _SourceT = TypeVar("_SourceT", Path, HttpUrl, ZipPath)

+Suffix = str
+

 def _split_dataset_path(
     source: _SourceT,
-) -> Tuple[_SourceT, Optional[PurePosixPath]]:
+) -> Tuple[_SourceT, Suffix, Optional[PurePosixPath]]:
     """Split off subpath (e.g. internal h5 dataset path)
     from a file path following a file extension.

     Examples:
         >>> _split_dataset_path(Path("my_file.h5/dataset"))
-        (...Path('my_file.h5'), PurePosixPath('dataset'))
+        (...Path('my_file.h5'), '.h5', PurePosixPath('dataset'))

         >>> _split_dataset_path(Path("my_plain_file"))
-        (...Path('my_plain_file'), None)
+        (...Path('my_plain_file'), '', None)

     """
     if isinstance(source, RelativeFilePath):
@@ -148,50 +150,55 @@ def _split_dataset_path(
     def separate_pure_path(path: PurePosixPath):
         for p in path.parents:
             if p.suffix in SUFFIXES_WITH_DATAPATH:
-                return p, PurePosixPath(path.relative_to(p))
+                return p, p.suffix, PurePosixPath(path.relative_to(p))

-        return path, None
+        return path, path.suffix, None

     if isinstance(src, HttpUrl):
-        file_path, data_path = separate_pure_path(PurePosixPath(src.path or ""))
+        file_path, suffix, data_path = separate_pure_path(PurePosixPath(src.path or ""))

         if data_path is None:
-            return src, None
+            return src, suffix, None

         return (
             HttpUrl(str(file_path).replace(f"/{data_path}", "")),
+            suffix,
             data_path,
         )

     if isinstance(src, ZipPath):
-        file_path, data_path = separate_pure_path(PurePosixPath(str(src)))
+        file_path, suffix, data_path = separate_pure_path(PurePosixPath(str(src)))

         if data_path is None:
-            return src, None
+            return src, suffix, None

         return (
             ZipPath(str(file_path).replace(f"/{data_path}", "")),
+            suffix,
             data_path,
         )

-    file_path, data_path = separate_pure_path(PurePosixPath(src))
-    return Path(file_path), data_path
+    file_path, suffix, data_path = separate_pure_path(PurePosixPath(src))
+    return Path(file_path), suffix, data_path


 def save_tensor(path: Union[Path, str], tensor: Tensor) -> None:
     # TODO: save axis meta data

-    data: NDArray[Any] = tensor.data.to_numpy()
-    file_path, subpath = _split_dataset_path(Path(path))
-    if not file_path.suffix:
+    data: NDArray[Any] = (  # pyright: ignore[reportUnknownVariableType]
+        tensor.data.to_numpy()
+    )
+    assert is_ndarray(data)
+    file_path, suffix, subpath = _split_dataset_path(Path(path))
+    if not suffix:
         raise ValueError(f"No suffix (needed to decide file format) found in {path}")

     file_path.parent.mkdir(exist_ok=True, parents=True)
     if file_path.suffix == ".npy":
         if subpath is not None:
             raise ValueError(f"Unexpected subpath {subpath} found in .npy path {path}")
         save_array(file_path, data)
-    elif file_path.suffix in (".h5", ".hdf", ".hdf5"):
+    elif suffix in (".h5", ".hdf", ".hdf5"):
         if subpath is None:
             dataset_path = DEFAULT_H5_DATASET_PATH
         else:
@@ -275,22 +282,39 @@ def load_dataset_stat(path: Path):
 def ensure_unzipped(source: Union[PermissiveFileSource, ZipPath], folder: Path):
     """unzip a (downloaded) **source** to a file in **folder** if source is a zip archive.
     Always returns the path to the unzipped source (maybe source itself)"""
-    local_weights_file = download(source).path
-    if isinstance(local_weights_file, ZipPath):
-        # source is inside a zip archive
-        out_path = folder / local_weights_file.filename
-        with local_weights_file.open("rb") as src, out_path.open("wb") as dst:
-            assert not isinstance(src, TextIOWrapper)
-            copyfileobj(src, dst)
-
-        local_weights_file = out_path
-
-    if zipfile.is_zipfile(local_weights_file):
-        # source itself is a zipfile
-        out_path = folder / local_weights_file.with_suffix(".unzipped").name
-        with zipfile.ZipFile(local_weights_file, "r") as f:
+    weights_reader = get_reader(source)
+    out_path = folder / (
+        weights_reader.original_file_name or f"file{weights_reader.suffix}"
+    )
+
+    if zipfile.is_zipfile(weights_reader):
+        out_path = out_path.with_name(out_path.name + ".unzipped")
+        out_path.parent.mkdir(exist_ok=True, parents=True)
+        with zipfile.ZipFile(weights_reader, "r") as f:
             f.extractall(out_path)

-        return out_path
     else:
-        return local_weights_file
+        out_path.parent.mkdir(exist_ok=True, parents=True)
+        with out_path.open("wb") as f:
+            copyfileobj(weights_reader, f)
+
+    return out_path


 def get_suffix(source: Union[ZipPath, FileSource]) -> str:
-    if isinstance(source, Path):
-        return source.suffix
-    elif isinstance(source, ZipPath):
-        return source.suffix
+    if isinstance(source, RelativeFilePath):
+        return source.path.suffix
+    elif isinstance(source, ZipPath):
+        return source.suffix
     elif isinstance(source, HttpUrl):
         if source.path is None:
             return ""
         else:
             return PurePosixPath(source.path).suffix
     else:
         assert_never(source)
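
ensure_unzipped now streams from the reader returned by get_reader instead of a locally downloaded path: zip archives are extracted, anything else is copied into the target folder. A usage sketch (the URL and folder are placeholders; the exact output name depends on the reader's reported file name):

    from pathlib import Path
    from bioimageio.core.io import ensure_unzipped

    weights = ensure_unzipped("https://example.com/weights.zip", Path("unpacked"))
    # a zip archive ends up extracted under ".../weights.zip.unzipped";
    # a plain file is copied into the folder unchanged
    print(weights)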
8 changes: 8 additions & 0 deletions bioimageio/core/utils/_type_guards.py
@@ -0,0 +1,8 @@
+"""use these type guards with caution!
+They widen the type to T[Any], which is not always correct."""
+
+from bioimageio.spec._internal import type_guards
+
+is_list = type_guards.is_list  # pyright: ignore[reportPrivateImportUsage]
+is_ndarray = type_guards.is_ndarray  # pyright: ignore[reportPrivateImportUsage]
+is_tuple = type_guards.is_tuple  # pyright: ignore[reportPrivateImportUsage]
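
As the module docstring warns, these re-exported guards only narrow to List[Any], Tuple[Any, ...], or NDArray[Any]; element types still need their own checks. A small sketch:

    from typing import Any

    from bioimageio.core.utils._type_guards import is_list, is_ndarray, is_tuple

    def first_item(value: Any):
        if is_list(value) or is_tuple(value):
            # pyright now sees List[Any] / Tuple[Any, ...]: indexing is fine,
            # but the element type remains unchecked
            return value[0] if value else None
        if is_ndarray(value):
            return value.flat[0] if value.size else None
        raise TypeError(f"unsupported type: {type(value)}")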
6 changes: 4 additions & 2 deletions dev/env-dev.yaml
@@ -5,17 +5,19 @@ channels:
   - nodefaults
   - pytorch
 dependencies:
-  - bioimageio.spec==0.5.4.1
+  - bioimageio.spec==0.5.4.3
   - black
   # - crick # currently requires python<=3.9
   - h5py
+  - httpx
   - imagecodecs
   - imageio>=2.5
   - jupyter
   - jupyter-black
   - keras>=3.0,<4
   - loguru
   - matplotlib
   - napari
   - numpy
   - onnx
   - onnxruntime
@@ -31,7 +33,7 @@ dependencies:
   - pytest-cov
   # - python=3.11 # removed
   - pytorch>=2.1,<3
-  - requests
+  - respx
   - rich
   - ruff
   - ruyaml