
workflow RDF #478

Open: wants to merge 48 commits into base: main

Changes from 1 commit

Commits (48):
- aa7cdc6 draft workflow RDF (FynnBe, Oct 26, 2022)
- 7924b2f update passthrough module generation (FynnBe, Oct 26, 2022)
- 825cad3 Tensor -> Arg; ArgType (FynnBe, Oct 26, 2022)
- 891093f test examples (FynnBe, Oct 26, 2022)
- 8f06f9e add schema validation (FynnBe, Oct 26, 2022)
- 6889bf8 add test_workflow_rdf.py (FynnBe, Oct 26, 2022)
- 9f0eed2 fix missing workflow import (FynnBe, Oct 26, 2022)
- 8639d8d update generate_rdf_docs.py and generate_json_specs.py (FynnBe, Oct 26, 2022)
- 1476670 fix typing import (FynnBe, Oct 26, 2022)
- fe9243e test_steps and better workflow kwargs (FynnBe, Oct 27, 2022)
- 7afc2c6 Merge branch 'main' into workflow_rdf (FynnBe, Oct 27, 2022)
- 5645d4c Update example_specs/workflows/hpa/single_cell_classification.yaml (FynnBe, Oct 28, 2022)
- 218b67a wip discussion with constantin (FynnBe, Oct 28, 2022)
- 94d1292 wip2 (FynnBe, Oct 28, 2022)
- 5831b04 Merge branch 'main' into workflow_rdf (FynnBe, Oct 31, 2022)
- 428d605 axes and options (FynnBe, Oct 31, 2022)
- 491e7b4 Merge branch 'main' into workflow_rdf (FynnBe, Nov 3, 2022)
- 6dacb68 update workflow RDF schema and raw_nodes (FynnBe, Nov 3, 2022)
- 9768848 finish first draft of workflow RDF spec (FynnBe, Nov 3, 2022)
- e3d963e inputs/options/outputs -> *_spec (FynnBe, Nov 4, 2022)
- cd4bd4c enforce unique step ids (FynnBe, Nov 4, 2022)
- d894da9 detect type workflow (FynnBe, Nov 4, 2022)
- 7ace197 don't accept emtpy strings (FynnBe, Nov 4, 2022)
- f5af22f also log binarized (FynnBe, Nov 4, 2022)
- 96376e5 Merge branch 'main' into workflow_rdf (FynnBe, Nov 8, 2022)
- 9fe4ca2 wip remove wf steps (FynnBe, Nov 24, 2022)
- 31ecba9 rename importable sources (FynnBe, Nov 24, 2022)
- ea1b826 black (FynnBe, Nov 24, 2022)
- 283da9a update changelog (FynnBe, Nov 24, 2022)
- 73b31b9 remove steps from workflow spec (FynnBe, Nov 24, 2022)
- 9c4a81d split up CallableSource field (FynnBe, Nov 24, 2022)
- 91e6783 set format_version as default (FynnBe, Nov 24, 2022)
- 8bdb9c9 prohibit serializing a list from a string (FynnBe, Nov 24, 2022)
- a89bf07 remove specialized axes classes (FynnBe, Nov 24, 2022)
- 5670cbc remove redundant brackets (FynnBe, Nov 24, 2022)
- 9b82e90 update workflow tests (FynnBe, Nov 25, 2022)
- 0243665 rename DEFAULT_TYPE_NAME_MAP (FynnBe, Nov 28, 2022)
- 91d141f rename ArbitraryAxes to UnknownAxes (FynnBe, Nov 28, 2022)
- a3d97c8 make nested_errors optional (FynnBe, Nov 30, 2022)
- b7b51a9 assert for mypy (FynnBe, Dec 6, 2022)
- eb4e3f8 some aliases for backward compatibility (FynnBe, Dec 6, 2022)
- 1102f6a add AXIS_LETTER_TO_NAME and AXIS_NAME_TO_LETTER (FynnBe, Dec 8, 2022)
- 6780a70 Merge branch 'main' into workflow_rdf (FynnBe, Feb 1, 2023)
- 924d667 Merge branch 'main' into workflow_rdf (FynnBe, Feb 9, 2023)
- b66798a update hello workflow example (FynnBe, Feb 9, 2023)
- c90cdd4 Merge branch 'main' into workflow_rdf (FynnBe, Mar 3, 2023)
- ff5cc6e Merge branch 'main' into workflow_rdf (FynnBe, Mar 15, 2023)
- 052c553 remove +\n from CLI help (FynnBe, Mar 15, 2023)
test_steps and better workflow kwargs
FynnBe committed Oct 27, 2022

Unverified: this commit is not signed, but one or more authors require that any commit attributed to them be signed.
commit fe9243e2694acdf34ccaa8bd35248f17e68fa811
4 changes: 4 additions & 0 deletions bioimageio/spec/shared/fields.py
@@ -82,6 +82,10 @@ def deserialize(self, value: typing.Any, attr: str = None, data: typing.Mapping[
        return value


class Boolean(DocumentedField, marshmallow_fields.Boolean):
    pass


class DateTime(DocumentedField, marshmallow_fields.DateTime):
    """
    Parses datetime in ISO8601 or if value already has datetime.datetime type
24 changes: 18 additions & 6 deletions bioimageio/spec/workflow/v0_2/raw_nodes.py
@@ -4,6 +4,7 @@
serialization and deserialization are defined in schema:
RDF <--schema--> raw nodes
"""
import typing
from dataclasses import dataclass
from pathlib import Path
from typing import Any, Dict, List, Union
@@ -15,18 +16,29 @@
from bioimageio.spec.shared.raw_nodes import RawNode

try:
    from typing import Literal
    from typing import Literal, get_args
except ImportError:
    from typing_extensions import Literal  # type: ignore
    from typing_extensions import Literal, get_args  # type: ignore

FormatVersion = FormatVersion
ArgType = Literal["tensor", "string", "object"]
ArgType = Literal["tensor", "int", "float", "string", "boolean", "list", "dict", "any"]
DefaultType = Union[int, float, str, bool, list, dict, None]
TYPE_NAME_MAP = {int: "int", float: "float", str: "string", bool: "boolean", list: "list", dict: "dict", None: "null"}


@dataclass
class Arg(RawNode):
    name: str = missing
    type: ArgType = missing
    default: Union[_Missing, DefaultType] = missing
    description: Union[_Missing, str] = missing


@dataclass
class WorkflowKwarg(RawNode):
    name: str = missing
    type: ArgType = missing
    default: DefaultType = missing
    description: Union[_Missing, str] = missing


@@ -46,7 +58,7 @@ class Workflow(_RDF):
    inputs: List[Arg] = missing
    outputs: List[Arg] = missing

    test_inputs: List[Union[URI, Path]] = missing
    test_outputs: List[Union[URI, Path]] = missing

    steps: List[Step] = missing
    test_steps: List[Step] = missing

    kwargs: Union[_Missing, List[WorkflowKwarg]] = missing
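The compatibility rule between the new `ArgType` names and Python default values can be sketched as a standalone check. This is a sketch only: `default_matches_type` is a hypothetical helper written for illustration, and this `TYPE_NAME_MAP` keys `NoneType` via `type(None)` rather than the literal `None` used in the diff.

```python
# Standalone sketch of the ArgType/default compatibility rule introduced above.
TYPE_NAME_MAP = {
    int: "int",
    float: "float",
    str: "string",
    bool: "boolean",
    list: "list",
    dict: "dict",
    type(None): "null",
}


def default_matches_type(default, arg_type_name):
    """Return True if `default` is compatible with the declared ArgType name."""
    if default is None or arg_type_name == "any":
        # unset defaults and the catch-all "any" type always pass
        return True
    # note: type(True) is bool, not int, so bool defaults map to "boolean"
    return TYPE_NAME_MAP.get(type(default)) == arg_type_name
```

This mirrors the early-return branches of the schema's `default_has_compatible_type` validator: a `None` default and the `"any"` type are always accepted, everything else must match by exact type name.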
121 changes: 86 additions & 35 deletions bioimageio/spec/workflow/v0_2/schema.py
@@ -27,9 +27,66 @@ class Arg(_BioImageIOSchema):
        validate=field_validators.OneOf(get_args(raw_nodes.ArgType)),
        bioimageio_description=f"Argument type. One of: {get_args(raw_nodes.ArgType)}",
    )
    default = fields.Raw(
        required=False,
        bioimageio_description="Default value compatible with type given by `type` field.",
        allow_none=True,
    )

    @validates_schema
    def default_has_compatible_type(self, data, **kwargs):
        if data.get("default") is None:
            return

        arg_type_name = data.get("type")
        if arg_type_name == "any":
            return

        default_type = type(data["default"])
        type_name = raw_nodes.TYPE_NAME_MAP[default_type]
        if type_name != arg_type_name:
            raise ValidationError(
                f"Default value of type {default_type} (type name: {type_name}) does not match type: {arg_type_name}"
            )

    description = fields.String(bioimageio_description="Description of argument/tensor.")


class WorkflowKwarg(_BioImageIOSchema):
    name = fields.String(
        required=True,
        bioimageio_description="Key word argument name. No duplicates are allowed.",
    )
    type = fields.String(
        required=True,
        validate=field_validators.OneOf(get_args(raw_nodes.ArgType)),
        bioimageio_description=f"Argument type. One of: {get_args(raw_nodes.ArgType)}",
    )
    default = fields.Raw(
        required=True,
        bioimageio_description="Default value compatible with type given by `type` field.",
        allow_none=True,
    )

    @validates_schema
    def default_has_compatible_type(self, data, **kwargs):
        if data.get("default") is None:
            return

        arg_type_name = data.get("type")
        if arg_type_name == "any":
            return

        default_type = type(data["default"])
        type_name = raw_nodes.TYPE_NAME_MAP[default_type]
        if type_name != arg_type_name:
            raise ValidationError(
                f"Default value of type {default_type} (type name: {type_name}) does not match type: {arg_type_name}"
            )

    description = fields.String(required=False, bioimageio_description="Description of key word argument.")


class Step(_BioImageIOSchema):
    id = fields.String(
        required=False,
@@ -69,7 +126,7 @@ class Workflow(_BioImageIOSchema, RDF):
        fields.Nested(Arg()),
        validate=field_validators.Length(min=1),
        required=True,
        bioimageio_description="Describes the inputs expected by this model.",
        bioimageio_description="Describes the inputs expected by this workflow.",
    )

    @validates("inputs")
@@ -84,7 +141,7 @@ def no_duplicate_input_names(self, value: typing.List[raw_nodes.Arg]):
    outputs = fields.List(
        fields.Nested(Arg()),
        validate=field_validators.Length(min=1),
        bioimageio_description="Describes the outputs from this model.",
        bioimageio_description="Describes the outputs from this workflow.",
    )

    @validates("outputs")
@@ -115,41 +172,12 @@ def inputs_and_outputs(self, data, **kwargs):
        if len(names) > len(set(names)):
            raise ValidationError("Duplicate names are not allowed.")

    test_inputs = fields.List(
        fields.Union([fields.URI(), fields.Path()]),
        validate=field_validators.Length(min=1),
        required=True,
        bioimageio_description="List of URIs or local relative paths to test inputs as described in inputs for "
        "**a single test case**. "
        "This means if your workflow has more than one input, you should provide one URI for each input."
        "Each test input should be a file with a ndarray in "
        "[numpy.lib file format](https://numpy.org/doc/stable/reference/generated/numpy.lib.format.html#module-numpy.lib.format)."
        "The extension must be '.npy'.",
    )

    test_outputs = fields.List(
        fields.Union([fields.URI(), fields.Path()]),
        validate=field_validators.Length(min=1),
        required=True,
        bioimageio_description="Analog to test_inputs.",
    kwargs = fields.List(
        fields.Nested(WorkflowKwarg()),
        required=False,
        bioimageio_description="Key word arguments for this workflow.",
    )

    @validates_schema
    def test_outputs_match(self, data, **kwargs):
        steps = data.get("steps")
        if not steps or not isinstance(steps, list) or not isinstance(steps[-1], raw_nodes.Step):
            raise ValidationError("invalid 'steps'")

        test_outputs = data.get("test_outputs")
        if not isinstance(test_outputs, list):
            raise ValidationError("invalid 'test_outputs'")

        if steps[-1].op == "select_outputs":
            if steps[-1].outputs:
                raise ValidationError("Unexpected 'outputs' defined for op: 'select_outputs'. Did you mean 'inputs'?")
            if len(test_outputs) != len(steps[-1].inputs):
                raise ValidationError(f"Expected {len(steps[-1].inputs)} 'test_inputs', but found {len(test_outputs)}")

    steps = fields.List(
        fields.Nested(Step()),
        validate=field_validators.Length(min=1),
@@ -175,3 +203,26 @@ def step_input_references_exist(self, data, **kwargs):

            if step.outputs:
                references.update({f"{step.id}.outputs.{out}" for out in step.outputs})

    test_steps = fields.List(
        fields.Nested(Step()),
        validate=field_validators.Length(min=1),
        required=True,
        bioimageio_description="Test steps to be executed consecutively.",
    )

    @validates_schema
    def test_step_input_references_exist(self, data, **kwargs):
        steps = data.get("test_steps")
        if not steps or not isinstance(steps, list) or not isinstance(steps[0], raw_nodes.Step):
            raise ValidationError("Missing/invalid 'test_steps'")

        references = set()
        for step in steps:
            if step.inputs:
                for si in step.inputs:
                    if si not in references:
                        raise ValidationError(f"Invalid test step input reference '{si}'")

            if step.outputs:
                references.update({f"{step.id}.outputs.{out}" for out in step.outputs})
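The dataflow rule enforced by `test_step_input_references_exist` above (a step may only consume `<step_id>.outputs.<name>` references produced by an earlier step) can be illustrated with a minimal standalone sketch. `check_step_references` and the dict-based step representation are illustrative only, not the spec's API:

```python
# Minimal sketch of the reference check performed by the validator above:
# walk the steps in order, collecting "<id>.outputs.<name>" references and
# rejecting any input that no earlier step produced.
def check_step_references(steps):
    """`steps`: list of dicts with 'id', 'inputs' and 'outputs' keys."""
    references = set()
    for step in steps:
        for si in step.get("inputs", []):
            if si not in references:
                raise ValueError(f"Invalid test step input reference '{si}'")
        for out in step.get("outputs", []):
            references.add(f"{step['id']}.outputs.{out}")
    return True
```

Because `references` starts empty, the first test step must take no inputs, which matches the `load_tensors` pattern used in the example workflows below.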
35 changes: 26 additions & 9 deletions example_specs/workflows/hpa/single_cell_classification.yaml
@@ -9,36 +9,53 @@ inputs:
  - name: protein
    type: tensor

test_inputs:
  - nuclei.npy
  - protein.npy
kwargs:
  - name: seg_prep
    type: boolean
    default: false


outputs:
  - name: cells
    type: tensor
  - name: scores
    type: tensor

test_outputs:
  - cells.npy
  - scores.npy

steps:
  - op: set_
  - id: segmentation
    op: model_inference
    inputs: [inputs.nuclei]  # take the first output of step 1 (id: data) as the only input
    outputs: [cells]
    kwargs:
      model_id: conscientious-seashell
      preprocessing: true
      rdf_source: conscientious-seashell
      preprocessing: ${{ kwargs.seg_prep }}
      postprocessing: false
  - id: classification
    op: model_inference
    inputs: [inputs.protein, segmentation.outputs.cells]  # take the second output of step1 and the output of step 2
    outputs: [scores]
    kwargs:
      model_id: straightforward-crocodile
      rdf_source: straightforward-crocodile
      preprocessing: true
      postprocessing: false
  - op: select_outputs
    inputs: [segmentation.outputs.cells, classification.outputs.scores]

test_steps:
  - id: test_tensors
    op: load_tensors
    outputs: [nuclei, protein, cells, scores]
    kwargs:
      sources: [nuclei.npy, protein.npy, cells.npy, scores.npy]
  - id: workflow
    op: run_workflow
    inputs: [test_tensors.outputs.nuclei, test_tensors.outputs.protein]
    outputs: [cells, scores]
    kwargs:
      rdf_source: ${{ self.rdf_source }}
  - op: assert_close
    inputs: [test_tensors.outputs.cells, workflow.outputs.cells]
  - op: assert_close
    inputs: [test_tensors.outputs.scores, workflow.outputs.scores]
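The `${{ kwargs.seg_prep }}` expression in the example above reads as a template placeholder to be resolved against the workflow's kwargs at execution time. A minimal sketch of such a substitution (assumed semantics; `resolve_kwarg_placeholder` is hypothetical, and the actual resolution would live in the workflow runner, not in this spec PR):

```python
import re

# Matches a whole "${{ kwargs.<name> }}" placeholder string.
PLACEHOLDER = re.compile(r"^\$\{\{\s*kwargs\.(\w+)\s*\}\}$")


def resolve_kwarg_placeholder(value, workflow_kwargs):
    """Replace a '${{ kwargs.<name> }}' string with the matching kwarg value.

    Non-string values and plain strings are returned unchanged.
    """
    if isinstance(value, str):
        match = PLACEHOLDER.match(value.strip())
        if match:
            return workflow_kwargs[match.group(1)]
    return value
```

Under this reading, `preprocessing: ${{ kwargs.seg_prep }}` resolves to the `seg_prep` default (`false`) unless the caller overrides it.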
51 changes: 41 additions & 10 deletions example_specs/workflows/stardist/stardist_example.yaml
@@ -8,9 +8,6 @@ inputs:
    type: tensor
    description: image with star-convex objects

test_inputs:
  - raw.npy

outputs:
  - name: labels
    type: tensor
@@ -21,19 +18,53 @@ outputs:
  - name: prob
    type: tensor

test_outputs:
  - labels.npy
  - coord.npy
  - points.npy
  - prob.npy
kwargs:
  - name: diameter
    type: float
    default: 2.3

steps:
  - op: zero_mean_unit_variance
  - op: model_inference
    kwargs:
      model_id: fearless-crab
      rdf_source: fearless-crab
      preprocessing: false  # disable the preprocessing
      postprocessing: false  # disable the postprocessing
  - op: stardist_postprocessing
    kwargs:
      diameter: 2.3
      diameter: ${{ kwargs.diameter }}

test_steps:
  - id: test_tensors
    op: load_tensors
    outputs:
      - raw
      - labels
      - coord
      - points
      - prob
    kwargs:
      sources:
        - raw.npy
        - labels.npy
        - coord.npy
        - points.npy
        - prob.npy
  - id: workflow
    op: run_workflow
    inputs: [test_tensors.outputs.raw]
    outputs:
      - labels
      - coord
      - points
      - prob
    kwargs:
      rdf_source: ${{ self.rdf_source }}
  - op: assert_close
    inputs: [test_tensors.outputs.labels, workflow.outputs.labels]
  - op: assert_close
    inputs: [test_tensors.outputs.coord, workflow.outputs.coord]
  - op: assert_close
    inputs: [test_tensors.outputs.points, workflow.outputs.points]
  - op: assert_close
    inputs: [test_tensors.outputs.prob, workflow.outputs.prob]
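Both example workflows end their test steps with `assert_close` ops, which presumably compare a workflow output tensor against the stored reference tensor within some tolerance. A pure-Python sketch of that semantics on flat number sequences (the real op would operate on ndarrays, likely via `numpy.testing.assert_allclose`, and the tolerance values here are made up):

```python
import math


def assert_close(actual, expected, rtol=1e-4, atol=1e-4):
    """Fail loudly if two flat sequences of numbers are not element-wise close."""
    if len(actual) != len(expected):
        raise AssertionError(f"length mismatch: {len(actual)} != {len(expected)}")
    for i, (a, e) in enumerate(zip(actual, expected)):
        if not math.isclose(a, e, rel_tol=rtol, abs_tol=atol):
            raise AssertionError(f"values differ at index {i}: {a} != {e}")
```

This mirrors the test pattern above: `load_tensors` provides both the inputs and the expected outputs, `run_workflow` recomputes the outputs, and one `assert_close` per output tensor closes the loop.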