From 922a1ec3caa7790b177d4fd72c098483aa8d127f Mon Sep 17 00:00:00 2001
From: mvdbeek <m.vandenbeek@gmail.com>
Date: Mon, 23 Oct 2023 19:30:41 +0200
Subject: [PATCH 1/7] Don't run through collect_outputs in test mode

---
 planemo/galaxy/activity.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/planemo/galaxy/activity.py b/planemo/galaxy/activity.py
index de382a875..00e50739b 100644
--- a/planemo/galaxy/activity.py
+++ b/planemo/galaxy/activity.py
@@ -244,7 +244,7 @@ def _execute(  # noqa C901
         end_datetime=datetime.now(),
         **response_kwds,
     )
-    if kwds.get("download_outputs", True):
+    if kwds.get("download_outputs"):
         output_directory = kwds.get("output_directory", None)
         ctx.vlog("collecting outputs from run...")
         run_response.collect_outputs(ctx, output_directory)

From 5ff19c851c07cc13b5d054c494911a9b6e6e7709 Mon Sep 17 00:00:00 2001
From: mvdbeek <m.vandenbeek@gmail.com>
Date: Wed, 25 Oct 2023 19:01:50 +0200
Subject: [PATCH 2/7] Ignore missing invocation outputs when fetching outputs

This isn't happening at the right place.
---
 planemo/engine/cwltool.py   |  8 +++++++-
 planemo/engine/galaxy.py    | 15 +++++++++++---
 planemo/engine/interface.py | 16 ++++++++++-----
 planemo/engine/toil.py      |  7 ++++++-
 planemo/galaxy/activity.py  | 41 ++++++++++++++++++++++++-------------
 5 files changed, 63 insertions(+), 24 deletions(-)

diff --git a/planemo/engine/cwltool.py b/planemo/engine/cwltool.py
index 600de0f16..ba595b1f6 100644
--- a/planemo/engine/cwltool.py
+++ b/planemo/engine/cwltool.py
@@ -1,5 +1,11 @@
 """Module contianing the :class:`CwlToolEngine` implementation of :class:`Engine`."""
 
+from typing import (
+    Callable,
+    List,
+    Optional,
+)
+
 from planemo import cwl
 from planemo.runnable import RunnableType
 from .interface import BaseEngine
@@ -13,7 +19,7 @@ class CwlToolEngine(BaseEngine):
 
     handled_runnable_types = [RunnableType.cwl_tool, RunnableType.cwl_workflow]
 
-    def _run(self, runnables, job_paths):
+    def _run(self, runnables, job_paths, output_collectors: Optional[List[Callable]] = None):
         """Run CWL job using cwltool."""
         results = []
         for runnable, job_path in zip(runnables, job_paths):
diff --git a/planemo/engine/galaxy.py b/planemo/engine/galaxy.py
index 16f2ef81d..90f76530d 100644
--- a/planemo/engine/galaxy.py
+++ b/planemo/engine/galaxy.py
@@ -2,7 +2,12 @@
 
 import abc
 import contextlib
-from typing import TYPE_CHECKING
+from typing import (
+    Callable,
+    List,
+    Optional,
+    TYPE_CHECKING,
+)
 
 from galaxy.tool_util.verify import interactor
 
@@ -44,10 +49,12 @@ class GalaxyEngine(BaseEngine, metaclass=abc.ABCMeta):
         RunnableType.directory,
     ]
 
-    def _run(self, runnables, job_paths):
+    def _run(self, runnables, job_paths, output_collectors: Optional[List[Callable]] = None):
         """Run job in Galaxy."""
         results = []
-        for runnable, job_path in zip(runnables, job_paths):
+        if not output_collectors:
+            output_collectors = [None] * len(runnables)
+        for runnable, job_path, collect_output in zip(runnables, job_paths, output_collectors):
             self._ctx.vlog(f"Serving artifact [{runnable}] with Galaxy.")
             with self.ensure_runnables_served([runnable]) as config:
                 self._ctx.vlog(f"Running job path [{job_path}]")
@@ -55,6 +62,8 @@ def _run(self, runnables, job_paths):
                     self._ctx.log(f"Running Galaxy with API configuration [{config.user_api_config}]")
                 run_response = execute(self._ctx, config, runnable, job_path, **self._kwds)
                 results.append(run_response)
+                if collect_output:
+                    collect_output(run_response)
 
         return results
 
diff --git a/planemo/engine/interface.py b/planemo/engine/interface.py
index 8d9efce0f..f7e935eef 100644
--- a/planemo/engine/interface.py
+++ b/planemo/engine/interface.py
@@ -4,7 +4,11 @@
 import json
 import os
 import tempfile
-from typing import List
+from typing import (
+    Callable,
+    List,
+    Optional,
+)
 
 from planemo.exit_codes import EXIT_CODE_UNSUPPORTED_FILE_TYPE
 from planemo.io import error
@@ -48,14 +52,14 @@ def can_run(self, runnable):
     def cleanup(self):
         """Default no-op cleanup method."""
 
-    def run(self, runnables, job_paths):
+    def run(self, runnables, job_paths, output_collectors: Optional[List[Callable]] = None):
         """Run a job using a compatible artifact (workflow or tool)."""
         self._check_can_run_all(runnables)
-        run_responses = self._run(runnables, job_paths)
+        run_responses = self._run(runnables, job_paths, output_collectors)
         return run_responses
 
     @abc.abstractmethod
-    def _run(self, runnables, job_path):
+    def _run(self, runnables, job_path, output_collectors: Optional[List[Callable]] = None):
         """Run a job using a compatible artifact (workflow or tool) wrapped as a runnable."""
 
     def _check_can_run(self, runnable):
@@ -94,6 +98,7 @@ def _run_test_cases(self, test_cases, test_timeout):
         runnables = [test_case.runnable for test_case in test_cases]
         job_paths = []
         tmp_paths = []
+        output_collectors = []
         for test_case in test_cases:
             if test_case.job_path is None:
                 job = test_case.job
@@ -111,8 +116,9 @@ def _run_test_cases(self, test_cases, test_timeout):
                 job_paths.append(job_path)
             else:
                 job_paths.append(test_case.job_path)
+            output_collectors.append(lambda run_response: test_case.structured_test_data(run_response))
         try:
-            run_responses = self._run(runnables, job_paths)
+            run_responses = self._run(runnables, job_paths, output_collectors)
         finally:
             for tmp_path in tmp_paths:
                 os.remove(tmp_path)
diff --git a/planemo/engine/toil.py b/planemo/engine/toil.py
index f85c5aa72..bf6b9160c 100644
--- a/planemo/engine/toil.py
+++ b/planemo/engine/toil.py
@@ -1,4 +1,9 @@
 """Module contianing the :class:`ToilEngine` implementation of :class:`Engine`."""
+from typing import (
+    Callable,
+    List,
+    Optional,
+)
 
 from planemo import cwl
 from planemo.runnable import RunnableType
@@ -13,7 +18,7 @@ class ToilEngine(BaseEngine):
 
     handled_runnable_types = [RunnableType.cwl_tool, RunnableType.cwl_workflow]
 
-    def _run(self, runnables, job_paths):
+    def _run(self, runnables, job_paths, output_collectors: Optional[List[Callable]] = None):
         """Run CWL job using Toil."""
         results = []
         for runnable, job_path in zip(runnables, job_paths):
diff --git a/planemo/galaxy/activity.py b/planemo/galaxy/activity.py
index 00e50739b..c3a5fa5a6 100644
--- a/planemo/galaxy/activity.py
+++ b/planemo/galaxy/activity.py
@@ -56,6 +56,7 @@
 if TYPE_CHECKING:
     from planemo.cli import PlanemoCliContext
     from planemo.galaxy.config import BaseGalaxyConfig
+    from planemo.runnable import RunnableOutput
 
 DEFAULT_HISTORY_NAME = "CWL Target History"
 ERR_NO_SUCH_TOOL = (
@@ -247,7 +248,7 @@ def _execute(  # noqa C901
     if kwds.get("download_outputs"):
         output_directory = kwds.get("output_directory", None)
         ctx.vlog("collecting outputs from run...")
-        run_response.collect_outputs(ctx, output_directory)
+        run_response.collect_outputs(output_directory)
         ctx.vlog("collecting outputs complete")
     return run_response
 
@@ -359,7 +360,7 @@ def __init__(
 
         self._job_info = None
 
-        self._outputs_dict = None
+        self._outputs_dict: Optional[Dict[str, Optional[str]]] = None
         self._start_datetime = start_datetime
         self._end_datetime = end_datetime
         self._successful = successful
@@ -385,6 +386,9 @@ def end_datetime(self):
         """End datetime of run."""
         return self._end_datetime
 
+    def output_src(self, output: "RunnableOutput", ignore_missing_outputs: bool = False) -> Dict[str, str]:
+        return {}
+
     def _get_extra_files(self, dataset_details):
         extra_files_url = (
             f"{self._user_gi.url}/histories/{self._history_id}/contents/{dataset_details['id']}/extra_files"
@@ -406,19 +410,19 @@ def _get_metadata(self, history_content_type, content_id):
         else:
             raise Exception("Unknown history content type encountered [%s]" % history_content_type)
 
-    def collect_outputs(self, ctx, output_directory):
-        outputs_dict = {}
+    def collect_outputs(self, output_directory: Optional[str] = None, ignore_missing_output: Optional[bool] = False):
+        outputs_dict: Dict[str, Optional[str]] = {}
         # TODO: rather than creating a directory just use
         # Galaxy paths if they are available in this
         # configuration.
         output_directory = output_directory or tempfile.mkdtemp()
 
-        ctx.log("collecting outputs to directory %s" % output_directory)
+        self._ctx.log("collecting outputs to directory %s" % output_directory)
 
         for runnable_output in get_outputs(self._runnable, gi=self._user_gi):
             output_id = runnable_output.get_id()
             if not output_id:
-                ctx.log("Workflow output identified without an ID (label), skipping")
+                self._ctx.log("Workflow output identified without an ID (label), skipping")
                 continue
 
             def get_dataset(dataset_details, filename=None):
@@ -429,9 +433,13 @@ def get_dataset(dataset_details, filename=None):
                     # and this is confusing...
                     the_output_directory = os.path.join(output_directory, parent_basename)
                     safe_makedirs(the_output_directory)
-                    destination = self.download_output_to(ctx, dataset_details, the_output_directory, filename=filename)
+                    destination = self.download_output_to(
+                        self._ctx, dataset_details, the_output_directory, filename=filename
+                    )
                 else:
-                    destination = self.download_output_to(ctx, dataset_details, output_directory, filename=filename)
+                    destination = self.download_output_to(
+                        self._ctx, dataset_details, output_directory, filename=filename
+                    )
                 if filename is None:
                     basename = parent_basename
                 else:
@@ -440,10 +448,10 @@ def get_dataset(dataset_details, filename=None):
                 return {"path": destination, "basename": basename}
 
             is_cwl = self._runnable.type in [RunnableType.cwl_workflow, RunnableType.cwl_tool]
-            output_src = self.output_src(runnable_output)
+            output_src = self.output_src(runnable_output, ignore_missing_output)
             if not output_src:
-                # Optional workflow output
-                ctx.vlog(f"Optional workflow output '{output_id}' not created, skipping")
+                # Optional workflow output or invocation failed
+                self._ctx.vlog(f"workflow output '{output_id}' not created, skipping")
                 outputs_dict[output_id] = None
                 continue
             output_dataset_id = output_src["id"]
@@ -476,7 +484,7 @@ def attach_file_properties(collection, cwl_output):
             outputs_dict[output_id] = output_dict_value
 
         self._outputs_dict = outputs_dict
-        ctx.vlog("collected outputs [%s]" % self._outputs_dict)
+        self._ctx.vlog("collected outputs [%s]" % self._outputs_dict)
 
     @property
     def log(self):
@@ -499,6 +507,8 @@ def invocation_details(self):
 
     @property
     def outputs_dict(self):
+        if self._outputs_dict is None:
+            self.collect_outputs(ignore_missing_output=True)
         return self._outputs_dict
 
     def download_output_to(self, ctx, dataset_details, output_directory, filename=None):
@@ -578,7 +588,7 @@ def to_galaxy_output(self, runnable_output):
         output_id = runnable_output.get_id()
         return tool_response_to_output(self.api_run_response, self._history_id, output_id)
 
-    def output_src(self, output):
+    def output_src(self, output, ignore_missing_outputs=False):
         outputs = self.api_run_response["outputs"]
         output_collections = self.api_run_response["output_collections"]
         output_id = output.get_id()
@@ -632,7 +642,7 @@ def to_galaxy_output(self, runnable_output):
         self._ctx.vlog("checking for output in invocation [%s]" % self._invocation)
         return invocation_to_output(self._invocation, self._history_id, output_id)
 
-    def output_src(self, output):
+    def output_src(self, output, ignore_missing_outputs=False):
         invocation = self._invocation
         # Use newer workflow outputs API.
 
@@ -643,6 +653,9 @@ def output_src(self, output):
             return invocation["output_collections"][output.get_id()]
         elif output.is_optional():
             return None
+        elif ignore_missing_outputs:
+            # We don't need to check this in testing mode, we'll get an error through failed invocation and failed history anyway
+            return None
         else:
             raise Exception(f"Failed to find output [{output_name}] in invocation outputs [{invocation['outputs']}]")
 

From de8b2a9fe094056553adde4949cac10898265702 Mon Sep 17 00:00:00 2001
From: mvdbeek <m.vandenbeek@gmail.com>
Date: Fri, 27 Oct 2023 13:37:22 +0200
Subject: [PATCH 3/7] Download outputs only if needed in test assertions

---
 planemo/cwl/run.py         |  2 +-
 planemo/engine/galaxy.py   |  4 ++--
 planemo/galaxy/activity.py | 45 ++++++++++++++++++++++++--------------
 planemo/runnable.py        | 21 ++++++++++++------
 4 files changed, 46 insertions(+), 26 deletions(-)

diff --git a/planemo/cwl/run.py b/planemo/cwl/run.py
index 7a2b8f472..bf22db886 100644
--- a/planemo/cwl/run.py
+++ b/planemo/cwl/run.py
@@ -62,7 +62,7 @@ def invocation_details(self) -> None:
         return None
 
     @property
-    def outputs_dict(self) -> Optional[Dict[str, Any]]:
+    def outputs_dict(self):
         return self._outputs
 
 
diff --git a/planemo/engine/galaxy.py b/planemo/engine/galaxy.py
index 90f76530d..1c2c6e97c 100644
--- a/planemo/engine/galaxy.py
+++ b/planemo/engine/galaxy.py
@@ -53,7 +53,7 @@ def _run(self, runnables, job_paths, output_collectors: Optional[List[Callable]]
         """Run job in Galaxy."""
         results = []
         if not output_collectors:
-            output_collectors = [None] * len(runnables)
+            output_collectors = [lambda x: None] * len(runnables)
         for runnable, job_path, collect_output in zip(runnables, job_paths, output_collectors):
             self._ctx.vlog(f"Serving artifact [{runnable}] with Galaxy.")
             with self.ensure_runnables_served([runnable]) as config:
@@ -62,7 +62,7 @@ def _run(self, runnables, job_paths, output_collectors: Optional[List[Callable]]
                     self._ctx.log(f"Running Galaxy with API configuration [{config.user_api_config}]")
                 run_response = execute(self._ctx, config, runnable, job_path, **self._kwds)
                 results.append(run_response)
-                if collect_output:
+                if collect_output is not None:
                     collect_output(run_response)
 
         return results
diff --git a/planemo/galaxy/activity.py b/planemo/galaxy/activity.py
index c3a5fa5a6..6dead53da 100644
--- a/planemo/galaxy/activity.py
+++ b/planemo/galaxy/activity.py
@@ -360,7 +360,7 @@ def __init__(
 
         self._job_info = None
 
-        self._outputs_dict: Optional[Dict[str, Optional[str]]] = None
+        self._outputs_dict: Dict[str, Optional[str]] = {}
         self._start_datetime = start_datetime
         self._end_datetime = end_datetime
         self._successful = successful
@@ -386,7 +386,11 @@ def end_datetime(self):
         """End datetime of run."""
         return self._end_datetime
 
-    def output_src(self, output: "RunnableOutput", ignore_missing_outputs: bool = False) -> Dict[str, str]:
+    @property
+    def outputs_dict(self):
+        return self._outputs_dict
+
+    def output_src(self, output: "RunnableOutput", ignore_missing_outputs: Optional[bool] = False) -> Dict[str, str]:
         return {}
 
     def _get_extra_files(self, dataset_details):
@@ -410,7 +414,12 @@ def _get_metadata(self, history_content_type, content_id):
         else:
             raise Exception("Unknown history content type encountered [%s]" % history_content_type)
 
-    def collect_outputs(self, output_directory: Optional[str] = None, ignore_missing_output: Optional[bool] = False):
+    def collect_outputs(
+        self,
+        output_directory: Optional[str] = None,
+        ignore_missing_output: Optional[bool] = False,
+        output_id: Optional[str] = None,
+    ):
         outputs_dict: Dict[str, Optional[str]] = {}
         # TODO: rather than creating a directory just use
         # Galaxy paths if they are available in this
@@ -420,13 +429,16 @@ def collect_outputs(self, output_directory: Optional[str] = None, ignore_missing
         self._ctx.log("collecting outputs to directory %s" % output_directory)
 
         for runnable_output in get_outputs(self._runnable, gi=self._user_gi):
-            output_id = runnable_output.get_id()
-            if not output_id:
+            runnable_output_id = runnable_output.get_id()
+            if not runnable_output_id:
                 self._ctx.log("Workflow output identified without an ID (label), skipping")
                 continue
 
+            if output_id and runnable_output_id != output_id:
+                continue
+
             def get_dataset(dataset_details, filename=None):
-                parent_basename = sanitize_filename(dataset_details.get("cwl_file_name") or output_id)
+                parent_basename = sanitize_filename(dataset_details.get("cwl_file_name") or runnable_output_id)
                 file_ext = dataset_details["file_ext"]
                 if file_ext == "directory":
                     # TODO: rename output_directory to outputs_directory because we can have output directories
@@ -451,8 +463,8 @@ def get_dataset(dataset_details, filename=None):
             output_src = self.output_src(runnable_output, ignore_missing_output)
             if not output_src:
                 # Optional workflow output or invocation failed
-                self._ctx.vlog(f"workflow output '{output_id}' not created, skipping")
-                outputs_dict[output_id] = None
+                self._ctx.vlog(f"workflow output '{runnable_output_id}' not created, skipping")
+                outputs_dict[runnable_output_id] = None
                 continue
             output_dataset_id = output_src["id"]
             galaxy_output = self.to_galaxy_output(runnable_output)
@@ -481,7 +493,9 @@ def attach_file_properties(collection, cwl_output):
                 attach_file_properties(output_metadata, cwl_output)
                 output_dict_value = output_metadata
 
-            outputs_dict[output_id] = output_dict_value
+            if output_id:
+                return output_dict_value
+            outputs_dict[runnable_output_id] = output_dict_value
 
         self._outputs_dict = outputs_dict
         self._ctx.vlog("collected outputs [%s]" % self._outputs_dict)
@@ -505,11 +519,10 @@ def job_info(self):
     def invocation_details(self):
         return None
 
-    @property
-    def outputs_dict(self):
-        if self._outputs_dict is None:
-            self.collect_outputs(ignore_missing_output=True)
-        return self._outputs_dict
+    def get_output(self, output_id):
+        if output_id not in self._outputs_dict:
+            self._outputs_dict[output_id] = self.collect_outputs(ignore_missing_output=True, output_id=output_id)
+        return self._outputs_dict[output_id]
 
     def download_output_to(self, ctx, dataset_details, output_directory, filename=None):
         if filename is None:
@@ -588,7 +601,7 @@ def to_galaxy_output(self, runnable_output):
         output_id = runnable_output.get_id()
         return tool_response_to_output(self.api_run_response, self._history_id, output_id)
 
-    def output_src(self, output, ignore_missing_outputs=False):
+    def output_src(self, output, ignore_missing_outputs: Optional[bool] = False):
         outputs = self.api_run_response["outputs"]
         output_collections = self.api_run_response["output_collections"]
         output_id = output.get_id()
@@ -642,7 +655,7 @@ def to_galaxy_output(self, runnable_output):
         self._ctx.vlog("checking for output in invocation [%s]" % self._invocation)
         return invocation_to_output(self._invocation, self._history_id, output_id)
 
-    def output_src(self, output, ignore_missing_outputs=False):
+    def output_src(self, output, ignore_missing_outputs: Optional[bool] = False):
         invocation = self._invocation
         # Use newer workflow outputs API.
 
diff --git a/planemo/runnable.py b/planemo/runnable.py
index 19e6027e4..9e69d7bec 100644
--- a/planemo/runnable.py
+++ b/planemo/runnable.py
@@ -587,19 +587,26 @@ def invocation_details(self):
     def log(self):
         """If engine related log is available, return as text data."""
 
+    @abc.abstractproperty
+    def outputs_dict(self):
+        """Return a dict of output descriptions."""
+
+    def get_output(self, output_id):
+        """Fetch output from engine."""
+        return self.outputs_dict.get(output_id)
+
     def structured_data(self, test_case: Optional[TestCase] = None) -> Dict[str, Any]:
         output_problems = []
         if isinstance(self, SuccessfulRunResponse) and self.was_successful:
-            outputs_dict = self.outputs_dict
             execution_problem = None
             if test_case:
                 for output_id, output_test in test_case.output_expectations.items():
-                    if output_id not in outputs_dict:
+                    output_value = self.get_output(output_id)
+                    if not output_value:
                         message = f"Expected output [{output_id}] not found in results."
                         output_problems.append(message)
                         continue
 
-                    output_value = outputs_dict[output_id]
                     output_problems.extend(test_case._check_output(output_id, output_value, output_test))
             if output_problems:
                 status = "failure"
@@ -656,10 +663,6 @@ def was_successful(self):
         """Return `True` to indicate this run was successful."""
         return True
 
-    @abc.abstractproperty
-    def outputs_dict(self):
-        """Return a dict of output descriptions."""
-
 
 class ErrorRunResponse(RunResponse):
     """Description of an error while attempting to execute a Runnable."""
@@ -709,6 +712,10 @@ def log(self):
         """Return potentially null stored `log` text."""
         return self._log
 
+    @property
+    def outputs_dict(self):
+        return {}
+
     def __str__(self):
         """Print a helpful error description of run."""
         message = f"Run failed with message [{self.error_message}]"

From 87014307e85a460f331caa8d344d022cc9cd59c4 Mon Sep 17 00:00:00 2001
From: mvdbeek <m.vandenbeek@gmail.com>
Date: Fri, 27 Oct 2023 18:39:33 +0200
Subject: [PATCH 4/7] Render invocation messages in test reports

---
 planemo/galaxy/activity.py                    |  2 +
 planemo/reports/build_report.py               | 43 +++++++++-
 planemo/reports/macros.tmpl                   | 10 +++
 planemo/reports/report_markdown.tpl           |  7 +-
 .../dataset_failed-test.yml                   |  2 +
 .../dataset_failed.yml                        | 19 +++++
 .../invalid_when_expression-test.yml          | 10 +++
 .../invalid_when_expression.yml               | 13 ++++
 .../output_not_found-test.yml                 |  5 ++
 .../output_not_found.yml                      | 15 ++++
 .../functional_test_tools/job_properties.xml  | 78 +++++++++++++++++++
 tests/test_cmd_test.py                        | 57 ++++++++++++++
 12 files changed, 258 insertions(+), 3 deletions(-)
 create mode 100644 tests/data/scheduling_failure_workflows/dataset_failed-test.yml
 create mode 100644 tests/data/scheduling_failure_workflows/dataset_failed.yml
 create mode 100644 tests/data/scheduling_failure_workflows/invalid_when_expression-test.yml
 create mode 100644 tests/data/scheduling_failure_workflows/invalid_when_expression.yml
 create mode 100644 tests/data/scheduling_failure_workflows/output_not_found-test.yml
 create mode 100644 tests/data/scheduling_failure_workflows/output_not_found.yml
 create mode 100644 tests/data/tools/functional_test_tools/job_properties.xml

diff --git a/planemo/galaxy/activity.py b/planemo/galaxy/activity.py
index 6dead53da..3547fdcf1 100644
--- a/planemo/galaxy/activity.py
+++ b/planemo/galaxy/activity.py
@@ -697,6 +697,8 @@ def collect_invocation_details(self, invocation_id=None):
                 "invocation_state": self.invocation_state,
                 "history_state": self.history_state,
                 "error_message": self.error_message,
+                # Messages are only present from 23.0 onward
+                "messages": invocation.get("messages", []),
             },
         }
         return invocation_details
diff --git a/planemo/reports/build_report.py b/planemo/reports/build_report.py
index adc0d018c..32b6f37a1 100644
--- a/planemo/reports/build_report.py
+++ b/planemo/reports/build_report.py
@@ -9,6 +9,46 @@
 
 TITLE = "Results (powered by Planemo)"
 
+cancel_fragment = "Invocation scheduling cancelled because"
+fail_fragment = "Invocation scheduling failed because"
+
+
+def render_message_to_string(invocation_message):
+    # ChatGPT did a reasonable job of translating this from https://github.com/galaxyproject/galaxy/blob/d92bbb144ffcda7e17368cf43dd25c8a9a3a7dd6/client/src/components/WorkflowInvocationState/InvocationMessage.vue#L93-L172
+    reason = invocation_message["reason"]
+    if reason == "user_request":
+        return f"{cancel_fragment} user requested cancellation."
+    elif reason == "history_deleted":
+        return f"{cancel_fragment} the history of the invocation was deleted."
+    elif reason == "cancelled_on_review":
+        return f"{cancel_fragment} the invocation was paused at step {invocation_message['workflow_step_id'] + 1} and not approved."
+    elif reason == "collection_failed":
+        return f"{fail_fragment} step {invocation_message['workflow_step_id'] + 1} requires a dataset collection created by step {invocation_message['dependent_workflow_step_id'] + 1}, but dataset collection entered a failed state."
+    elif reason == "dataset_failed":
+        if invocation_message.get("dependent_workflow_step_id") is not None:
+            return f"{fail_fragment} step {invocation_message['workflow_step_id'] + 1} requires a dataset created by step {invocation_message['dependent_workflow_step_id'] + 1}, but dataset entered a failed state."
+        else:
+            return f"{fail_fragment} step {invocation_message['workflow_step_id'] + 1} requires a dataset, but dataset entered a failed state."
+    elif reason == "job_failed":
+        return f"{fail_fragment} step {invocation_message['workflow_step_id'] + 1} depends on job(s) created in step {invocation_message['dependent_workflow_step_id'] + 1}, but a job for that step failed."
+    elif reason == "output_not_found":
+        return f"{fail_fragment} step {invocation_message['workflow_step_id'] + 1} depends on output '{invocation_message['output_name']}' of step {invocation_message['dependent_workflow_step_id'] + 1}, but this step did not produce an output of that name."
+    elif reason == "expression_evaluation_failed":
+        return f"{fail_fragment} step {invocation_message['workflow_step_id'] + 1} contains an expression that could not be evaluated."
+    elif reason == "when_not_boolean":
+        return f"{fail_fragment} step {invocation_message['workflow_step_id'] + 1} is a conditional step and the result of the when expression is not a boolean type."
+    elif reason == "unexpected_failure":
+        at_step = ""
+        if invocation_message.get("workflow_step_id") is not None:
+            at_step = f" at step {invocation_message['workflow_step_id'] + 1}"
+        if "details" in invocation_message and invocation_message["details"]:
+            return f"{fail_fragment} an unexpected failure occurred{at_step}: '{invocation_message['details']}'"
+        return f"{fail_fragment} an unexpected failure occurred{at_step}."
+    elif reason == "workflow_output_not_found":
+        return f"Defined workflow output '{invocation_message['output_name']}' was not found in step {invocation_message['workflow_step_id'] + 1}."
+    else:
+        return reason
+
 
 def build_report(structured_data, report_type="html", execution_type="Test", **kwds):
     """Use report_{report_type}.tpl to build page for report."""
@@ -19,12 +59,12 @@ def build_report(structured_data, report_type="html", execution_type="Test", **k
 
     __fix_test_ids(environment)
     environment = __inject_summary(environment)
+    environment["execution_type"] = execution_type
 
     if report_type == "html":
         # The HTML report format needs a lot of extra, custom data.
         # IMO, this seems to suggest it should be embedded.
         environment["title"] = None
-        environment["execution_type"] = execution_type
         markdown = template_data(environment, "report_markdown.tpl")
         environment["title"] = " ".join((environment["execution_type"], TITLE))
         environment["raw_data"] = base64.b64encode(markdown.encode("utf-8")).decode("utf-8")
@@ -50,6 +90,7 @@ def template_data(environment, template_name, **kwds):
         env_kwargs["trim_blocks"] = True
     env = Environment(loader=PackageLoader("planemo", "reports"), **env_kwargs)
     env.filters["strip_control_characters"] = lambda x: strip_control_characters(x) if x else x
+    env.globals["render_message_to_string"] = render_message_to_string
     template = env.get_template(template_name)
     return template.render(**environment)
 
diff --git a/planemo/reports/macros.tmpl b/planemo/reports/macros.tmpl
index dd40f95af..7edb924d2 100644
--- a/planemo/reports/macros.tmpl
+++ b/planemo/reports/macros.tmpl
@@ -65,4 +65,14 @@
    {% endif %}
 {%    endfor %}
       </details>
+{% endmacro %}
+
+
+{% macro render_invocation_messages(messages, summary_label='Invocation Messages') %}
+   * {{summary_label}}
+{%    for message in messages %}
+
+     - {{ render_message_to_string(message) }}
+
+{%    endfor %}
 {% endmacro %}
\ No newline at end of file
diff --git a/planemo/reports/report_markdown.tpl b/planemo/reports/report_markdown.tpl
index e9f104950..2888d5354 100644
--- a/planemo/reports/report_markdown.tpl
+++ b/planemo/reports/report_markdown.tpl
@@ -1,4 +1,4 @@
-{% from 'macros.tmpl' import render_invocation_details, render_job_parameters, render_steps %}
+{% from 'macros.tmpl' import render_invocation_details, render_invocation_messages, render_job_parameters, render_steps %}
 {% if title %}
 # {{ execution_type }} {{ title }}
 
@@ -32,7 +32,8 @@
 
 {% set display_job_attributes = {'command_line': 'Command Line', 'exit_code': 'Exit Code', 'stderr': 'Standard Error', 'stdout': 'Standard Output', 'traceback': 'Traceback'} %}
 {% for status, desc in {'error': 'Errored', 'failure': 'Failed', 'success': 'Passed'}.items() if state[status]%}
-<details><summary>{{ desc }} {{ execution_type }}s</summary>
+{% set expanded = "open" if status in ("error", "failure") else "" %}
+<details {{ expanded }}><summary>{{ desc }} {{ execution_type }}s</summary>
 {%   for test in raw_data.tests %}
 {%     if test.data.status == status %}
 {%       if test.data.status == 'success' %}
@@ -75,6 +76,8 @@
 
     #### Workflow invocation details
 
+{{render_invocation_messages(test.data.invocation_details.details.messages)}}
+
 {{render_steps(test.data.invocation_details.steps.values(), display_job_attributes)}}
 
 {{render_invocation_details(test.data.invocation_details.details)}}
diff --git a/tests/data/scheduling_failure_workflows/dataset_failed-test.yml b/tests/data/scheduling_failure_workflows/dataset_failed-test.yml
new file mode 100644
index 000000000..88dd44bc6
--- /dev/null
+++ b/tests/data/scheduling_failure_workflows/dataset_failed-test.yml
@@ -0,0 +1,2 @@
+- job: {}
+  outputs: {}
diff --git a/tests/data/scheduling_failure_workflows/dataset_failed.yml b/tests/data/scheduling_failure_workflows/dataset_failed.yml
new file mode 100644
index 000000000..51b61619f
--- /dev/null
+++ b/tests/data/scheduling_failure_workflows/dataset_failed.yml
@@ -0,0 +1,19 @@
+class: GalaxyWorkflow
+steps:
+  job_props:
+    tool_id: job_properties
+    state:
+      thebool: true
+      failbool: true
+  apply:
+    tool_id: __APPLY_RULES__
+    in:
+      input: job_props/list_output
+    state:
+      rules:
+        rules:
+          - type: add_column_metadata
+            value: identifier0
+        mapping:
+          - type: list_identifiers
+            columns: [0]
diff --git a/tests/data/scheduling_failure_workflows/invalid_when_expression-test.yml b/tests/data/scheduling_failure_workflows/invalid_when_expression-test.yml
new file mode 100644
index 000000000..1233e3010
--- /dev/null
+++ b/tests/data/scheduling_failure_workflows/invalid_when_expression-test.yml
@@ -0,0 +1,10 @@
+- job:
+    some_file:
+      class: File
+      path: ../hello.txt
+    should_run: true
+  outputs:
+    some_output:
+      asserts:
+        has_text:
+          text: "Hello World!"
diff --git a/tests/data/scheduling_failure_workflows/invalid_when_expression.yml b/tests/data/scheduling_failure_workflows/invalid_when_expression.yml
new file mode 100644
index 000000000..2a1586aa5
--- /dev/null
+++ b/tests/data/scheduling_failure_workflows/invalid_when_expression.yml
@@ -0,0 +1,13 @@
+class: GalaxyWorkflow
+inputs:
+  should_run:
+    type: boolean
+  some_file:
+    type: data
+steps:
+  cat1:
+    tool_id: cat1
+    in:
+      input1: some_file
+      should_run: should_run
+    when: $(:syntaxError:)
diff --git a/tests/data/scheduling_failure_workflows/output_not_found-test.yml b/tests/data/scheduling_failure_workflows/output_not_found-test.yml
new file mode 100644
index 000000000..d7934f9db
--- /dev/null
+++ b/tests/data/scheduling_failure_workflows/output_not_found-test.yml
@@ -0,0 +1,5 @@
+- job:
+    data_input:
+      path: ../hello.txt
+      class: File
+  outputs: {}
diff --git a/tests/data/scheduling_failure_workflows/output_not_found.yml b/tests/data/scheduling_failure_workflows/output_not_found.yml
new file mode 100644
index 000000000..a212bd017
--- /dev/null
+++ b/tests/data/scheduling_failure_workflows/output_not_found.yml
@@ -0,0 +1,15 @@
+class: GalaxyWorkflow
+inputs:
+  data_input: data
+steps:
+  cat1:
+    tool_id: cat1
+    in:
+      input1: data_input
+    outputs:
+      out_file1:
+        rename: "my new name"
+  first_cat1:
+    tool_id: cat1
+    in:
+      input1: cat1/does_not_exist
diff --git a/tests/data/tools/functional_test_tools/job_properties.xml b/tests/data/tools/functional_test_tools/job_properties.xml
new file mode 100644
index 000000000..19ee032ab
--- /dev/null
+++ b/tests/data/tools/functional_test_tools/job_properties.xml
@@ -0,0 +1,78 @@
+<tool id="job_properties" name="Test Job Properties" version="1.0.0">
+    <stdio>
+        <exit_code range="127" level="fatal" description="Failing exit code." />
+    </stdio>
+    <version_command>echo 'v1.1'</version_command>
+    <command><![CDATA[
+#if $thebool
+    echo 'The bool is true' &&
+    echo 'The bool is really true' 1>&2 &&
+    echo 'This is a line of text.' > '$out_file1' &&
+    cp '$out_file1' '$one' &&
+    cp '$out_file1' '$two' &&
+    sleep $sleepsecs
+#else
+    echo 'The bool is not true' &&
+    echo 'The bool is very not true' 1>&2 &&
+    echo 'This is a different line of text.' > '$out_file1' &&
+    sleep $sleepsecs &&
+    sh -c 'exit 2'
+#end if
+#if $failbool
+    ## use ';' to concatenate commands so that the next one is run independently
+    ## of the exit code of the previous one
+    ; exit 127
+#end if
+    ]]></command>
+    <inputs>
+        <param name="sleepsecs" type="integer" value="0" label="Sleep this many seconds"/>
+        <param name="thebool" type="boolean" label="The boolean property" />
+        <param name="failbool" type="boolean" label="The failure property" checked="false" />
+    </inputs>
+    <outputs>
+        <data name="out_file1" format="txt" />
+        <collection name="list_output" type="list" label="A list output">
+            <data name="one" format="txt" />
+            <data name="two" format="txt" />
+        </collection>
+    </outputs>
+    <tests>
+        <test expect_exit_code="0">
+            <param name="thebool" value="true" />
+            <output name="out_file1" file="simple_line.txt" >
+                <metadata name="data_lines" value="1" />
+            </output>
+            <assert_command>
+                <has_text text="really" />
+            </assert_command>
+            <assert_stdout>
+                <has_line line="The bool is true" />
+            </assert_stdout>
+            <assert_stderr>
+                <has_line line="The bool is really true" />
+            </assert_stderr>
+            <assert_command_version>
+                <has_text text="v1.1" />
+            </assert_command_version>
+        </test>
+        <test expect_exit_code="2">
+            <param name="thebool" value="false" />
+            <output name="out_file1" file="simple_line_alternative.txt" />
+            <assert_command>
+                <has_text text="very not" />
+            </assert_command>
+            <assert_stdout>
+                <has_line line="The bool is not true" />
+            </assert_stdout>
+            <assert_stderr>
+                <has_line line="The bool is very not true" />
+            </assert_stderr>
+        </test>
+        <test expect_exit_code="127" expect_failure="true">
+            <param name="thebool" value="true" />
+            <param name="failbool" value="true" />
+        </test>
+    </tests>
+    <help>
+    </help>
+</tool>
diff --git a/tests/test_cmd_test.py b/tests/test_cmd_test.py
index e02658514..59fcc5e09 100644
--- a/tests/test_cmd_test.py
+++ b/tests/test_cmd_test.py
@@ -18,6 +18,8 @@
     TEST_TOOLS_DIR,
 )
 
+SCHEDULING_WORKFLOWS_PATH = os.path.join(TEST_DATA_DIR, "scheduling_failure_workflows")
+FUNCTIONAL_TEST_TOOLS = os.path.join(TEST_DATA_DIR, "tools", "functional_test_tools")
 FETCH_DATA_DATA_MANAGER_TEST_PATH = "data_manager/data_manager_fetch_genome_dbkeys_all_fasta/data_manager/data_manager_fetch_genome_all_fasta_dbkeys.xml"
 BOWTIE2_DATA_MANAGER_TEST_PATH = (
     "data_manager/data_manager_bowtie2_index_builder/data_manager/bowtie2_index_builder.xml"
@@ -377,3 +379,58 @@ def test_workflow_with_identical_output_names(self):
             test_command = self.append_profile_argument_if_needed(test_command)
             test_command.append(test_artifact)
             self._check_exit_code(test_command, exit_code=0)
+
+    @skip_if_environ("PLANEMO_SKIP_GALAXY_TEST")
+    def test_scheduling_error_invalid_when_expression(self):
+        with self._isolate() as test_dir:
+            test_artifact = os.path.join(SCHEDULING_WORKFLOWS_PATH, "invalid_when_expression.yml")
+            markdown_output_path = os.path.join(test_dir, "test_output.md")
+            test_command = self._test_command()
+            test_command = self.append_profile_argument_if_needed(test_command)
+            test_command.append(test_artifact)
+            test_command.append("--test_output_markdown")
+            test_command.append(markdown_output_path)
+            self._check_exit_code(test_command, exit_code=1)
+            with open(markdown_output_path) as out:
+                markdown_content = out.read()
+            assert (
+                "Invocation scheduling failed because step 3 contains an expression that could not be evaluated"
+                in markdown_content
+            )
+
+    @skip_if_environ("PLANEMO_SKIP_GALAXY_TEST")
+    def test_scheduling_error_output_not_found(self):
+        with self._isolate() as test_dir:
+            test_artifact = os.path.join(SCHEDULING_WORKFLOWS_PATH, "output_not_found.yml")
+            markdown_output_path = os.path.join(test_dir, "test_output.md")
+            test_command = self._test_command()
+            test_command = self.append_profile_argument_if_needed(test_command)
+            test_command.append(test_artifact)
+            test_command.append("--test_output_markdown")
+            test_command.append(markdown_output_path)
+            self._check_exit_code(test_command, exit_code=1)
+            with open(markdown_output_path) as out:
+                markdown_content = out.read()
+            assert (
+                "Invocation scheduling failed because step 3 depends on output 'does_not_exist' of step 2, but this step did not produce an output of that name"
+                in markdown_content
+            )
+
+    @skip_if_environ("PLANEMO_SKIP_GALAXY_TEST")
+    def test_scheduling_error_dataset_failed(self):
+        job_properties = os.path.join(FUNCTIONAL_TEST_TOOLS, "job_properties.xml")
+        with self._isolate() as test_dir:
+            test_artifact = os.path.join(SCHEDULING_WORKFLOWS_PATH, "dataset_failed.yml")
+            markdown_output_path = os.path.join(test_dir, "test_output.md")
+            test_command = test_command = self._test_command("--extra_tools", job_properties)
+            test_command = self.append_profile_argument_if_needed(test_command)
+            test_command.append(test_artifact)
+            test_command.append("--test_output_markdown")
+            test_command.append(markdown_output_path)
+            self._check_exit_code(test_command, exit_code=1)
+            with open(markdown_output_path) as out:
+                markdown_content = out.read()
+            assert (
+                "Invocation scheduling failed because step 2 requires a dataset, but dataset entered a failed state."
+                in markdown_content
+            )

From e834939d2bbc8e9e98743722889ea458446ac8d2 Mon Sep 17 00:00:00 2001
From: mvdbeek <m.vandenbeek@gmail.com>
Date: Fri, 27 Oct 2023 18:43:59 +0200
Subject: [PATCH 5/7] Ignore complexity rule in auto-translated code

---
 planemo/reports/build_report.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/planemo/reports/build_report.py b/planemo/reports/build_report.py
index 32b6f37a1..8aaf0b77d 100644
--- a/planemo/reports/build_report.py
+++ b/planemo/reports/build_report.py
@@ -13,7 +13,7 @@
 fail_fragment = "Invocation scheduling failed because"
 
 
-def render_message_to_string(invocation_message):
+def render_message_to_string(invocation_message):  # noqa: C901
     # ChatGPT did a reasonable job of translating this from https://github.com/galaxyproject/galaxy/blob/d92bbb144ffcda7e17368cf43dd25c8a9a3a7dd6/client/src/components/WorkflowInvocationState/InvocationMessage.vue#L93-L172
     reason = invocation_message["reason"]
     if reason == "user_request":

From df01218b8da19780dee25a9bc15b50c8ab9c4244 Mon Sep 17 00:00:00 2001
From: mvdbeek <m.vandenbeek@gmail.com>
Date: Sat, 28 Oct 2023 17:33:50 +0200
Subject: [PATCH 6/7] Shorten test timeout

Maybe the shutdown takes too long if the tool still runs ?
---
 tests/data/tools/timeout.xml | 2 +-
 tests/test_cmd_test.py       | 6 +++---
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/tests/data/tools/timeout.xml b/tests/data/tools/timeout.xml
index 37c669b44..04f352da6 100644
--- a/tests/data/tools/timeout.xml
+++ b/tests/data/tools/timeout.xml
@@ -2,7 +2,7 @@
     <description>just wastes time</description>
     <command detect_errors="exit_code"><![CDATA[
         echo "output" > '$output' &&
-        sleep 30;
+        sleep 5;
     ]]></command>
     <inputs>
     </inputs>
diff --git a/tests/test_cmd_test.py b/tests/test_cmd_test.py
index 59fcc5e09..2e96bfa10 100644
--- a/tests/test_cmd_test.py
+++ b/tests/test_cmd_test.py
@@ -121,10 +121,10 @@ def test_tool_test_timeout(self):
             with open(json_out.name) as fh:
                 tool_test_json = json.load(fh)
                 assert tool_test_json["summary"]["num_tests"] == 1
-                # check run time, for smaller 10 since the test will take a bit longer than 1s
-                # the important bit is that it's not about 30s (since the test tool calls `sleep 30`)
+                # check run time, for smaller 4 since the test will take a bit longer than 1s
+                # the important bit is that it's not about 5s (since the test tool calls `sleep 5`)
                 assert (
-                    float(tool_test_json["tests"][0]["data"]["time_seconds"]) <= 10
+                    float(tool_test_json["tests"][0]["data"]["time_seconds"]) <= 4
                 ), "Test needed more than 10 sec but should time out after 1"
                 assert (
                     "Timed out after" in tool_test_json["tests"][0]["data"]["output_problems"][0]

From 11a70848d1add34b71c92528da1b9d2235aee0a2 Mon Sep 17 00:00:00 2001
From: mvdbeek <m.vandenbeek@gmail.com>
Date: Sat, 28 Oct 2023 20:13:36 +0200
Subject: [PATCH 7/7] Fix up tutorial test

---
 tests/test_training_tutorial.py | 34 ++++++++++++++-------------------
 1 file changed, 14 insertions(+), 20 deletions(-)

diff --git a/tests/test_training_tutorial.py b/tests/test_training_tutorial.py
index 04d769a95..af439fdd2 100644
--- a/tests/test_training_tutorial.py
+++ b/tests/test_training_tutorial.py
@@ -327,32 +327,26 @@ def test_tutorial_create_hands_on_tutorial() -> None:
     """Test :func:`planemo.training.tutorial.tutorial.create_hands_on_tutorial`."""
     tuto = Tutorial(training=training, topic=topic)
     os.makedirs(tuto.wf_dir)
-    # with init_wf_id and no Galaxy URL
-    tuto.init_wf_id = "ID"
-    tuto.training.galaxy_url = None
-    with pytest.raises(Exception, match="No Galaxy URL given"):
-        tuto.create_hands_on_tutorial(CTX)
-    # with init_wf_id and no Galaxy API key
-    tuto.init_wf_id = "ID"
-    tuto.training.galaxy_url = f"http://{KWDS['host']}:{KWDS['port']}"
-    tuto.training.galaxy_api_key = None
-    with pytest.raises(Exception, match="No API key to access the given Galaxy instance"):
-        tuto.create_hands_on_tutorial(CTX)
-    # with init_wf_id
     with engine_context(CTX, **KWDS) as galaxy_engine:
         assert isinstance(galaxy_engine, LocalManagedGalaxyEngine)
         with galaxy_engine.ensure_runnables_served([RUNNABLE]) as config:
+            # fail without Galaxy URL
+            tuto.init_wf_id = "ID"
+            tuto.training.galaxy_url = None
+            with pytest.raises(Exception, match="No Galaxy URL given"):
+                tuto.create_hands_on_tutorial(CTX)
+            tuto.training.galaxy_url = f"http://{KWDS['host']}:{KWDS['port']}"
             tuto.init_wf_id = config.workflow_id(WF_FP)
             tuto.training.galaxy_api_key = config.user_api_key
             tuto.create_hands_on_tutorial(CTX)
-    assert os.path.exists(tuto.tuto_fp)
-    os.remove(tuto.tuto_fp)
-    # with init_wf_fp
-    tuto.init_wf_id = None
-    tuto.init_wf_fp = WF_FP
-    tuto.create_hands_on_tutorial(CTX)
-    assert os.path.exists(tuto.tuto_fp)
-    shutil.rmtree("topics")
+            assert os.path.exists(tuto.tuto_fp)
+            os.remove(tuto.tuto_fp)
+            # with init_wf_fp
+            tuto.init_wf_id = None
+            tuto.init_wf_fp = WF_FP
+            tuto.create_hands_on_tutorial(CTX)
+            assert os.path.exists(tuto.tuto_fp)
+            shutil.rmtree("topics")
 
 
 @skip_if_environ("PLANEMO_SKIP_GALAXY_TESTS")