bioimage-io · FynnBe · Oct 26, 2022 · Oct 26, 2022 · Oct 26, 2022 · Oct 26, 2022
diff --git a/bioimageio/spec/__init__.py b/bioimageio/spec/__init__.py
@@ -1,4 +1,4 @@
-from . import collection, model, rdf, shared
+from . import collection, model, rdf, shared, workflow
 from .commands import update_format, update_rdf, validate
 from .io_ import (
     get_resource_package_content,

diff --git a/bioimageio/spec/shared/fields.py b/bioimageio/spec/shared/fields.py
@@ -82,6 +82,10 @@ def deserialize(self, value: typing.Any, attr: str = None, data: typing.Mapping[
             return value
 
 
+class Boolean(DocumentedField, marshmallow_fields.Boolean):
+    """marshmallow Boolean field combined with DocumentedField; adds no behavior of its own."""
+
+    pass
+
+
 class DateTime(DocumentedField, marshmallow_fields.DateTime):
     """
     Parses datetime in ISO8601 or if value already has datetime.datetime type

diff --git a/bioimageio/spec/workflow/__init__.py b/bioimageio/spec/workflow/__init__.py
@@ -0,0 +1,14 @@
+from . import v0_2
+
+# autogen: start
+from . import converters, raw_nodes, schema, utils
+from .raw_nodes import FormatVersion
+
+# `get_args` is imported from `typing` when available, otherwise from `typing_extensions`.
+try:
+    from typing import get_args
+except ImportError:
+    from typing_extensions import get_args  # type: ignore
+
+# last type argument of `FormatVersion` (presumably the most recent format version -- confirm ordering)
+format_version = get_args(FormatVersion)[-1]
+
+# autogen: stop
diff --git a/bioimageio/spec/workflow/converters.py b/bioimageio/spec/workflow/converters.py
@@ -0,0 +1,3 @@
+# Auto-generated by generate_passthrough_modules.py - do not modify
+
+from .v0_2.converters import *
diff --git a/bioimageio/spec/workflow/raw_nodes.py b/bioimageio/spec/workflow/raw_nodes.py
@@ -0,0 +1,3 @@
+# Auto-generated by generate_passthrough_modules.py - do not modify
+
+from .v0_2.raw_nodes import *
diff --git a/bioimageio/spec/workflow/schema.py b/bioimageio/spec/workflow/schema.py
@@ -0,0 +1,3 @@
+# Auto-generated by generate_passthrough_modules.py - do not modify
+
+from .v0_2.schema import *
diff --git a/bioimageio/spec/workflow/utils.py b/bioimageio/spec/workflow/utils.py
@@ -0,0 +1,3 @@
+# Auto-generated by generate_passthrough_modules.py - do not modify
+
+from .v0_2.utils import *
diff --git a/bioimageio/spec/workflow/v0_2/__init__.py b/bioimageio/spec/workflow/v0_2/__init__.py
@@ -0,0 +1,9 @@
+from . import converters, raw_nodes, schema, utils
+from .raw_nodes import FormatVersion
+
+# `get_args` is imported from `typing` when available, otherwise from `typing_extensions`.
+try:
+    from typing import get_args
+except ImportError:
+    from typing_extensions import get_args  # type: ignore
+
+# last type argument of `FormatVersion` (presumably the most recent format version -- confirm ordering)
+format_version = get_args(FormatVersion)[-1]
diff --git a/bioimageio/spec/workflow/v0_2/converters.py b/bioimageio/spec/workflow/v0_2/converters.py
@@ -0,0 +1,3 @@
+from bioimageio.spec.rdf.v0_2.converters import maybe_convert as maybe_convert_rdf
+
+# the general RDF converter is exposed unchanged under this module's `maybe_convert` name
+maybe_convert = maybe_convert_rdf
diff --git a/bioimageio/spec/workflow/v0_2/raw_nodes.py b/bioimageio/spec/workflow/v0_2/raw_nodes.py
@@ -0,0 +1,64 @@
+""" raw nodes for the workflow RDF spec
+
+raw nodes are the deserialized equivalent to the content of any RDF.
+serialization and deserialization are defined in schema:
+RDF <--schema--> raw nodes
+"""
+import typing
+from dataclasses import dataclass
+from pathlib import Path
+from typing import Any, Dict, List, Union
+
+from marshmallow import missing
+from marshmallow.utils import _Missing
+
+from bioimageio.spec.rdf.v0_2.raw_nodes import FormatVersion, RDF as _RDF, URI
+from bioimageio.spec.shared.raw_nodes import RawNode
+
+try:
+    from typing import Literal, get_args
+except ImportError:
+    from typing_extensions import Literal, get_args  # type: ignore
+
+# re-bound so that the imported `FormatVersion` is an explicit module-level name of this module
+FormatVersion = FormatVersion
+# type names allowed for the `type` of an argument
+ArgType = Literal["tensor", "int", "float", "string", "boolean", "list", "dict", "any"]
+# Python types a default value may have
+DefaultType = Union[int, float, str, bool, list, dict, None]
+# maps a Python type to its type name
+# NOTE(review): the last key is `None`, not `type(None)`, so a lookup by `type(value)` cannot reach it,
+# and "null" is not part of `ArgType` -- confirm this entry is intended.
+TYPE_NAME_MAP = {int: "int", float: "float", str: "string", bool: "boolean", list: "list", dict: "dict", None: "null"}
+
+
+@dataclass
+class Arg(RawNode):
+    """Raw node of a single argument; used for the entries of `Workflow.inputs` and `Workflow.outputs`."""
+
+    # every field defaults to marshmallow's `missing` sentinel
+    name: str = missing
+    type: ArgType = missing
+    # `default` and `description` may stay `missing`
+    default: Union[_Missing, DefaultType] = missing
+    description: Union[_Missing, str] = missing
+
+
+@dataclass
+class WorkflowKwarg(RawNode):
+    """Raw node of a single key word argument; used for the entries of `Workflow.kwargs`."""
+
+    # every field defaults to marshmallow's `missing` sentinel
+    name: str = missing
+    type: ArgType = missing
+    # unlike `Arg.default`, this annotation does not include `_Missing`
+    default: DefaultType = missing
+    description: Union[_Missing, str] = missing
+
+
+@dataclass
+class Step(RawNode):
+    """Raw node of a single step; used for the entries of `Workflow.steps` and `Workflow.test_steps`."""
+
+    # only `op` is annotated without `_Missing`; all other fields may stay `missing`
+    id: Union[_Missing, str] = missing
+    op: str = missing
+    inputs: Union[_Missing, List[str]] = missing
+    outputs: Union[_Missing, List[str]] = missing
+    kwargs: Union[_Missing, Dict[str, Any]] = missing
+
+
+@dataclass
+class Workflow(_RDF):
+    """Raw node of a workflow RDF; extends the general RDF raw node with workflow specific fields."""
+
+    type: Literal["workflow"] = missing
+
+    # arguments going into and coming out of the workflow
+    inputs: List[Arg] = missing
+    outputs: List[Arg] = missing
+
+    # steps of the workflow itself and of its test
+    steps: List[Step] = missing
+    test_steps: List[Step] = missing
+
+    # the only workflow specific field annotated as possibly `missing`
+    kwargs: Union[_Missing, List[WorkflowKwarg]] = missing
diff --git a/bioimageio/spec/workflow/v0_2/schema.py b/bioimageio/spec/workflow/v0_2/schema.py
@@ -0,0 +1,228 @@
+import typing
+
+from marshmallow import ValidationError, missing, validates, validates_schema
+
+from bioimageio.spec.rdf.v0_2.schema import RDF
+from bioimageio.spec.shared import field_validators, fields
+from bioimageio.spec.shared.schema import SharedBioImageIOSchema
+from . import raw_nodes
+
+try:
+    from typing import get_args
+except ImportError:
+    from typing_extensions import get_args  # type: ignore
+
+
+class _BioImageIOSchema(SharedBioImageIOSchema):
+    """Base schema of this module; binds this package's `raw_nodes` module to the shared schema."""
+
+    raw_nodes = raw_nodes
+
+
+class Arg(_BioImageIOSchema):
+    """Schema of a workflow argument: `name`, `type` and optional `default` and `description`."""
+
+    name = fields.String(
+        required=True,
+        bioimageio_description="Argument/tensor name. No duplicates are allowed.",
+    )
+    type = fields.String(
+        required=True,
+        validate=field_validators.OneOf(get_args(raw_nodes.ArgType)),
+        bioimageio_description=f"Argument type. One of: {get_args(raw_nodes.ArgType)}",
+    )
+    default = fields.Raw(
+        required=False,
+        bioimageio_description="Default value compatible with type given by `type` field.",
+        allow_none=True,
+    )
+
+    @validates_schema
+    def default_has_compatible_type(self, data, **kwargs):
+        """Check that a given, non-null `default` is compatible with the declared `type`.
+
+        Raises:
+            ValidationError: if the Python type of the default has no entry in `raw_nodes.TYPE_NAME_MAP`,
+                or if its type name differs from `type` (unless `type` is "any").
+        """
+        default = data.get("default")
+        if default is None:
+            # missing or explicit null default: nothing to compare
+            return
+
+        arg_type_name = data.get("type")
+        if arg_type_name == "any":
+            return
+
+        # exact type lookup on purpose: `bool` must not be reported as `int`
+        default_type = type(default)
+        # `.get` instead of indexing: an unmapped type is a validation problem, not a KeyError
+        type_name = raw_nodes.TYPE_NAME_MAP.get(default_type)
+        if type_name is None:
+            raise ValidationError(
+                f"Default value of unsupported type {default_type} does not match type: {arg_type_name}"
+            )
+
+        if type_name != arg_type_name:
+            raise ValidationError(
+                f"Default value of type {default_type} (type name: {type_name}) does not match type: {arg_type_name}"
+            )
+
+    description = fields.String(bioimageio_description="Description of argument/tensor.")
+
+
+class WorkflowKwarg(_BioImageIOSchema):
+    """Schema of a workflow key word argument: `name`, `type`, `default` and optional `description`."""
+
+    name = fields.String(
+        required=True,
+        bioimageio_description="Key word argument name. No duplicates are allowed.",
+    )
+    type = fields.String(
+        required=True,
+        validate=field_validators.OneOf(get_args(raw_nodes.ArgType)),
+        bioimageio_description=f"Argument type. One of: {get_args(raw_nodes.ArgType)}",
+    )
+    default = fields.Raw(
+        required=True,
+        bioimageio_description="Default value compatible with type given by `type` field.",
+        allow_none=True,
+    )
+
+    @validates_schema
+    def default_has_compatible_type(self, data, **kwargs):
+        """Check that a non-null `default` is compatible with the declared `type`.
+
+        Raises:
+            ValidationError: if the Python type of the default has no entry in `raw_nodes.TYPE_NAME_MAP`,
+                or if its type name differs from `type` (unless `type` is "any").
+        """
+        default = data.get("default")
+        if default is None:
+            # explicit null default (allowed by `allow_none`): nothing to compare
+            return
+
+        arg_type_name = data.get("type")
+        if arg_type_name == "any":
+            return
+
+        # exact type lookup on purpose: `bool` must not be reported as `int`
+        default_type = type(default)
+        # `.get` instead of indexing: an unmapped type is a validation problem, not a KeyError
+        type_name = raw_nodes.TYPE_NAME_MAP.get(default_type)
+        if type_name is None:
+            raise ValidationError(
+                f"Default value of unsupported type {default_type} does not match type: {arg_type_name}"
+            )
+
+        if type_name != arg_type_name:
+            raise ValidationError(
+                f"Default value of type {default_type} (type name: {type_name}) does not match type: {arg_type_name}"
+            )
+
+    description = fields.String(required=False, bioimageio_description="Description of key word argument.")
+
+
+class Step(_BioImageIOSchema):
+    """Schema of a single step; only `op` is required."""
+
+    # `id` and `op` must both be valid Python identifiers
+    id = fields.String(
+        required=False,
+        validate=field_validators.Predicate("isidentifier"),
+        bioimageio_description="Step id for referencing the steps' kwargs or outputs.",
+    )
+    op = fields.String(
+        required=True,
+        validate=field_validators.Predicate("isidentifier"),
+        bioimageio_description="Name of operation. Must be implemented in bioimageio.core or bioimageio.contrib.",
+    )
+    # reference strings; no per-item validator is attached here
+    inputs = fields.List(
+        fields.String(
+            bioimageio_description="named output of a previous step with the pattern '<step id>.outputs.<output name>'",
+        ),
+        required=False,
+    )
+    # each output name must be a valid Python identifier
+    outputs = fields.List(
+        fields.String(
+            validate=field_validators.Predicate("isidentifier"),
+        ),
+        bioimageio_description="output names for this step",
+        required=False,
+    )
+    kwargs = fields.Kwargs(bioimageio_description="Key word arguments for op.")
+
+
+class Workflow(_BioImageIOSchema, RDF):
+    """Schema of a workflow RDF: general RDF fields plus inputs, outputs, kwargs, steps and test steps."""
+
+    bioimageio_description = f"""# BioImage.IO Workflow Resource Description File {get_args(raw_nodes.FormatVersion)[-1]}
+This specification defines the fields used in a BioImage.IO-compliant resource description file (`RDF`) for describing workflows.
+These fields are typically stored in a YAML file which we call Workflow Resource Description File or `workflow RDF`.
+
+The workflow RDF YAML file contains mandatory and optional fields. In the following description, optional fields are indicated by _optional_.
+_optional*_ with an asterisk indicates the field is optional depending on the value in another field.
+"""
+    inputs = fields.List(
+        fields.Nested(Arg()),
+        validate=field_validators.Length(min=1),
+        required=True,
+        bioimageio_description="Describes the inputs expected by this workflow.",
+    )
+
+    @validates("inputs")
+    def no_duplicate_input_names(self, value: typing.List[raw_nodes.Arg]):
+        """Raise a ValidationError if two entries of `inputs` share a name."""
+        if not isinstance(value, list) or not all(isinstance(v, raw_nodes.Arg) for v in value):
+            raise ValidationError("Could not check for duplicate input names due to another validation error.")
+
+        names = [t.name for t in value]
+        if len(names) > len(set(names)):
+            raise ValidationError("Duplicate input names are not allowed.")
+
+    # required: the raw node annotates `outputs` like `inputs`, and `inputs_and_outputs` rejects its absence
+    outputs = fields.List(
+        fields.Nested(Arg()),
+        validate=field_validators.Length(min=1),
+        required=True,
+        bioimageio_description="Describes the outputs from this workflow.",
+    )
+
+    @validates("outputs")
+    def no_duplicate_output_names(self, value: typing.List[raw_nodes.Arg]):
+        """Raise a ValidationError if two entries of `outputs` share a name."""
+        if not isinstance(value, list) or not all(isinstance(v, raw_nodes.Arg) for v in value):
+            raise ValidationError("Could not check for duplicate output names due to another validation error.")
+
+        # the guard above guarantees `raw_nodes.Arg` instances, so plain attribute access suffices
+        names = [t.name for t in value]
+        if len(names) > len(set(names)):
+            raise ValidationError("Duplicate output names are not allowed.")
+
+    @validates_schema
+    def inputs_and_outputs(self, data, **kwargs):
+        """Raise a ValidationError if a name is used more than once across `inputs` and `outputs`."""
+        ipts = data.get("inputs")
+        outs = data.get("outputs")
+        # `or` short-circuits: the element checks only run once both values are known to be lists
+        # (an eagerly built list of conditions would iterate over a missing value and raise a TypeError)
+        if (
+            not isinstance(ipts, list)
+            or not isinstance(outs, list)
+            or not all(isinstance(v, raw_nodes.Arg) for v in ipts)
+            or not all(isinstance(v, raw_nodes.Arg) for v in outs)
+        ):
+            raise ValidationError("Could not check for duplicate names due to another validation error.")
+
+        # no duplicate names
+        names = [t.name for t in ipts + outs]
+        if len(names) > len(set(names)):
+            raise ValidationError("Duplicate names are not allowed.")
+
+    kwargs = fields.List(
+        fields.Nested(WorkflowKwarg()),
+        required=False,
+        bioimageio_description="Key word arguments for this workflow.",
+    )
+
+    steps = fields.List(
+        fields.Nested(Step()),
+        validate=field_validators.Length(min=1),
+        required=True,
+        bioimageio_description="Workflow steps to be executed consecutively.",
+    )
+
+    @staticmethod
+    def _are_valid_steps(steps) -> bool:
+        """Return True if `steps` is a non-empty list that holds only `raw_nodes.Step` instances."""
+        return bool(steps) and isinstance(steps, list) and all(isinstance(s, raw_nodes.Step) for s in steps)
+
+    @staticmethod
+    def _check_step_input_references(steps, references, step_kind):
+        """Walk `steps` in order and check that each step input is an already known reference.
+
+        Args:
+            steps: list of `raw_nodes.Step` to check.
+            references: set of reference strings known before the first step; extended in place by
+                '<step id>.outputs.<output name>' for the outputs of each visited step.
+            step_kind: "step" or "test step"; only used in the error message.
+
+        Raises:
+            ValidationError: for the first step input that is not a known reference.
+        """
+        for step in steps:
+            # `step.inputs`/`step.outputs` may be marshmallow's falsy `missing`
+            for ref in step.inputs or ():
+                if ref not in references:
+                    raise ValidationError(f"Invalid {step_kind} input reference '{ref}'")
+
+            # outputs of a step without id cannot be referenced, so they are not registered
+            if step.id and step.outputs:
+                references.update({f"{step.id}.outputs.{out}" for out in step.outputs})
+
+    @validates_schema
+    def step_input_references_exist(self, data, **kwargs):
+        """Check that each step input refers to a workflow input or to an output of a previous step."""
+        inputs = data.get("inputs")
+        if not inputs or not isinstance(inputs, list) or not all(isinstance(ipt, raw_nodes.Arg) for ipt in inputs):
+            raise ValidationError("Missing/invalid 'inputs'")
+        steps = data.get("steps")
+        if not self._are_valid_steps(steps):
+            raise ValidationError("Missing/invalid 'steps'")
+
+        # workflow inputs are referenced as 'inputs.<input name>'
+        references = {f"inputs.{ipt.name}" for ipt in inputs}
+        self._check_step_input_references(steps, references, "step")
+
+    test_steps = fields.List(
+        fields.Nested(Step()),
+        validate=field_validators.Length(min=1),
+        required=True,
+        bioimageio_description="Test steps to be executed consecutively.",
+    )
+
+    @validates_schema
+    def test_step_input_references_exist(self, data, **kwargs):
+        """Check that each test step input refers to an output of a previous test step."""
+        steps = data.get("test_steps")
+        if not self._are_valid_steps(steps):
+            raise ValidationError("Missing/invalid 'test_steps'")
+
+        # test steps start without any known reference: workflow inputs are not registered here
+        self._check_step_input_references(steps, set(), "test step")
diff --git a/bioimageio/spec/workflow/v0_2/utils.py b/bioimageio/spec/workflow/v0_2/utils.py
@@ -0,0 +1,5 @@
+from . import raw_nodes
+
+
+def filter_resource_description(raw_rd: raw_nodes.Workflow) -> raw_nodes.Workflow:
+    """Return `raw_rd` unchanged; no filtering is applied to a workflow resource description."""
+    return raw_rd
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1,3 @@
		# Auto-generated by generate_passthrough_modules.py - do not modify

		from .v0_2.converters import *
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1,3 @@
		# Auto-generated by generate_passthrough_modules.py - do not modify

		from .v0_2.raw_nodes import *
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1,3 @@
		# Auto-generated by generate_passthrough_modules.py - do not modify

		from .v0_2.schema import *
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1,3 @@
		# Auto-generated by generate_passthrough_modules.py - do not modify

		from .v0_2.utils import *
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1,3 @@
		from bioimageio.spec.rdf.v0_2.converters import maybe_convert as maybe_convert_rdf

		maybe_convert = maybe_convert_rdf