nipype · djarecka · May 4, 2020 · Apr 9, 2020 · Apr 16, 2020 · Apr 22, 2020
diff --git a/pydra/engine/boutiques.py b/pydra/engine/boutiques.py
@@ -0,0 +1,221 @@
+import typing as ty
+import json
+import attr
+import subprocess as sp
+import os
+from pathlib import Path
+from functools import reduce
+
+from ..utils.messenger import AuditFlag
+from ..engine import ShellCommandTask
+from ..engine.specs import (
+    SpecInfo,
+    ShellSpec,
+    ShellOutSpec,
+    File,
+    Directory,
+    attr_fields,
+)
+from .helpers import ensure_list, execute
+from .helpers_file import template_update, is_local_file
+
+
+class BoshTask(ShellCommandTask):
+    """Shell Command Task based on the Boutiques descriptor"""
+
+    def __init__(
+        self,
+        zenodo=None,
+        bosh_file=None,
+        audit_flags: AuditFlag = AuditFlag.NONE,
+        cache_dir=None,
+        input_spec: ty.Optional[SpecInfo] = None,
+        messenger_args=None,
+        messengers=None,
+        name=None,
+        output_spec: ty.Optional[SpecInfo] = None,
+        rerun=False,
+        strip=False,
+        **kwargs,
+    ):
+        """
+        Initialize this task.
+
+        Parameters
+        ----------
+        zenodo: :obj: str
+            Zenodo ID
+        bosh_file : : str
+            json file with the boutiques descriptors
+        audit_flags : :obj:`pydra.utils.messenger.AuditFlag`
+            Auditing configuration
+        cache_dir : :obj:`os.pathlike`
+            Cache directory
+        input_spec : :obj:`pydra.engine.specs.SpecInfo`
+            Specification of inputs.
+        messenger_args :
+            TODO
+        messengers :
+            TODO
+        name : :obj:`str`
+            Name of this task.
+        output_spec : :obj:`pydra.engine.specs.BaseSpec`
+            Specification of inputs.
+        strip : :obj:`bool`
+            TODO
+
+        """
+        if (bosh_file and zenodo) or not (bosh_file or zenodo):
+            raise Exception("either bosh or zenodo has to be specified")
+        elif zenodo:
+            bosh_file = self._download_spec(zenodo)
+
+        # retry logic - an error on travis is raised randomly, not able to reproduce
+        tries, tries_max = 0, 7
+        while tries < tries_max:
+            try:
+                with bosh_file.open() as f:
+                    self.bosh_spec = json.load(f)
+                break
+            except json.decoder.JSONDecodeError:
+                tries += 1
+                if tries == tries_max:
+                    raise
+
+        if input_spec is None:
+            input_spec = self._prepare_input_spec()
+        self.input_spec = input_spec
+        if output_spec is None:
+            output_spec = self._prepare_output_spec()
+        self.output_spec = output_spec
+        self.bindings = []
+
+        super(BoshTask, self).__init__(
+            name=name,
+            input_spec=input_spec,
+            output_spec=output_spec,
+            executable=["bosh", "exec", "launch", str(bosh_file)],
+            args=["-s"],
+            audit_flags=audit_flags,
+            messengers=messengers,
+            messenger_args=messenger_args,
+            cache_dir=cache_dir,
+            strip=strip,
+            rerun=rerun,
+            **kwargs,
+        )
+        self.strip = strip
+
+    def _download_spec(self, zenodo):
+        """ usind bosh pull to download the zenodo file"""
+        spec_file = (
+            Path(os.environ["HOME"])
+            / ".cache/boutiques/production"
+            / (zenodo.replace(".", "-") + ".json")
+        )
+        for i in range(3):
+            if not spec_file.exists():
+                sp.run(["bosh", "pull", zenodo])
+        if not spec_file.exists():
+            raise Exception(f"can't pull zenodo file {zenodo}")
+        return spec_file
+
+    def _prepare_input_spec(self):
+        """ creating input spec from the zenodo file"""
+        binputs = self.bosh_spec["inputs"]
+        self._input_spec_keys = {}
+        fields = []
+        for input in binputs:
+            name = input["id"]
+            if input["type"] == "File":
+                tp = File
+            elif input["type"] == "String":
+                tp = str
+            elif input["type"] == "Number":
+                tp = float
+            elif input["type"] == "Flag":
+                tp = bool
+            else:
+                tp = None
+            # adding list
+            if tp and "list" in input and input["list"]:
+                tp = ty.List[tp]
+
+            mdata = {
+                "help_string": input.get("description", None) or input["name"],
+                "mandatory": not input["optional"],
+                "argstr": input.get("command-line-flag", None),
+            }
+            fields.append((name, tp, mdata))
+            self._input_spec_keys[input["value-key"]] = "{" + f"{name}" + "}"
+
+        spec = SpecInfo(name="Inputs", fields=fields, bases=(ShellSpec,))
+        return spec
+
+    def _prepare_output_spec(self):
+        """ creating output spec from the zenodo file"""
+        boutputs = self.bosh_spec["output-files"]
+        fields = []
+        for output in boutputs:
+            name = output["id"]
+            path_template = reduce(
+                lambda s, r: s.replace(*r),
+                self._input_spec_keys.items(),
+                output["path-template"],
+            )
+            mdata = {
+                "help_string": output.get("description", None) or output["name"],
+                "mandatory": not output["optional"],
+                "output_file_template": path_template,
+            }
+            fields.append((name, attr.ib(type=File, metadata=mdata)))
+
+        spec = SpecInfo(name="Outputs", fields=fields, bases=(ShellOutSpec,))
+        return spec
+
+    def _command_args_single(self, state_ind, ind=None):
+        """Get command line arguments for a single state"""
+        input_filepath = self._input_file(state_ind=state_ind, ind=ind)
+        cmd_list = (
+            self.inputs.executable + [input_filepath] + self.inputs.args + self.bindings
+        )
+        return cmd_list
+
+    def _input_file(self, state_ind, ind=None):
+        input_json = {}
+        for f in attr_fields(self.inputs):
+            if f.name in ["executable", "args"]:
+                continue
+            if self.state and f"{self.name}.{f.name}" in state_ind:
+                value = getattr(self.inputs, f.name)[state_ind[f"{self.name}.{f.name}"]]
+            else:
+                value = getattr(self.inputs, f.name)
+            # adding to the json file if specified by the user
+            if value is not attr.NOTHING and value != "NOTHING":
+                if is_local_file(f):
+                    value = Path(value)
+                    self.bindings.extend(["-v", f"{value.parent}:{value.parent}:ro"])
+                    value = str(value)
+
+                input_json[f.name] = value
+
+        filename = self.cache_dir / f"{self.name}-{ind}.json"
+        with open(filename, "w") as jsonfile:
+            json.dump(input_json, jsonfile)
+
+        return str(filename)
+
+    def _run_task(self):
+        self.output_ = None
+        args = self.command_args
+        if args:
+            # removing empty strings
+            args = [str(el) for el in args if el not in ["", " "]]
+            keys = ["return_code", "stdout", "stderr"]
+            values = execute(args, strip=self.strip)
+            self.output_ = dict(zip(keys, values))
+            if self.output_["return_code"]:
+                if self.output_["stderr"]:
+                    raise RuntimeError(self.output_["stderr"])
+                else:
+                    raise RuntimeError(self.output_["stdout"])
diff --git a/pydra/engine/specs.py b/pydra/engine/specs.py
@@ -311,9 +311,8 @@ def collect_additional_outputs(self, input_spec, inputs, output_dir):
                 if fld.type is File:
                     # assuming that field should have either default or metadata, but not both
                     if (
-                        not (fld.default is None or fld.default == attr.NOTHING)
-                        and fld.metadata
-                    ):
+                        fld.default is None or fld.default == attr.NOTHING
+                    ) and not fld.metadata:  # TODO: is it right?
                         raise Exception("File has to have default value or metadata")
                     elif not fld.default == attr.NOTHING:
                         additional_out[fld.name] = self._field_defaultvalue(
@@ -360,9 +359,23 @@ def _field_metadata(self, fld, inputs, output_dir):
         if "value" in fld.metadata:
             return output_dir / fld.metadata["value"]
         elif "output_file_template" in fld.metadata:
-            return output_dir / fld.metadata["output_file_template"].format(
-                **inputs.__dict__
+            sfx_tmpl = (output_dir / fld.metadata["output_file_template"]).suffixes
+            if sfx_tmpl:
+                # removing suffix from input field if template has it's own suffix
+                inputs_templ = {
+                    k: v.split(".")[0]
+                    for k, v in inputs.__dict__.items()
+                    if isinstance(v, str)
+                }
+            else:
+                inputs_templ = {
+                    k: v for k, v in inputs.__dict__.items() if isinstance(v, str)
+                }
+            out_path = output_dir / fld.metadata["output_file_template"].format(
+                **inputs_templ
             )
+            return out_path
+
         elif "callable" in fld.metadata:
             return fld.metadata["callable"](fld.name, output_dir)
         else:

diff --git a/pydra/engine/tests/data_tests/test.nii.gz b/pydra/engine/tests/data_tests/test.nii.gz
diff --git a/pydra/engine/tests/test_boutiques.py b/pydra/engine/tests/test_boutiques.py
@@ -0,0 +1,130 @@
+import os, shutil
+import subprocess as sp
+from pathlib import Path
+import pytest
+
+from ..core import Workflow
+from ..task import ShellCommandTask
+from ..submitter import Submitter
+from ..boutiques import BoshTask
+from .utils import result_no_submitter, result_submitter, no_win
+
+need_bosh_docker = pytest.mark.skipif(
+    shutil.which("docker") is None
+    or sp.call(["docker", "info"] or sp.call(["bosh", "version"])),
+    reason="requires docker and bosh",
+)
+
+if bool(shutil.which("sbatch")):
+    Plugins = ["cf", "slurm"]
+else:
+    Plugins = ["cf"]
+
+Infile = Path(__file__).resolve().parent / "data_tests" / "test.nii.gz"
+
+
+@no_win
+@need_bosh_docker
+@pytest.mark.parametrize(
+    "maskfile", ["test_brain.nii.gz", "test_brain", "test_brain.nii"]
+)
+@pytest.mark.parametrize("results_function", [result_no_submitter, result_submitter])
+@pytest.mark.parametrize("plugin", Plugins)
+def test_boutiques_1(maskfile, plugin, results_function):
+    """ simple task to run fsl.bet using BoshTask"""
+    btask = BoshTask(name="NA", zenodo="zenodo.1482743")
+    btask.inputs.infile = Infile
+    btask.inputs.maskfile = maskfile
+    res = results_function(btask, plugin)
+
+    assert res.output.return_code == 0
+
+    # checking if the outfile exists and if it has proper name
+    assert res.output.outfile.name == "test_brain.nii.gz"
+    assert res.output.outfile.exists()
+    # other files should also have proper names, but they do not exist
+    assert res.output.out_outskin_off.name == "test_brain_outskin_mesh.off"
+    assert not res.output.out_outskin_off.exists()
+
+
+@no_win
+@need_bosh_docker
+@pytest.mark.parametrize(
+    "maskfile", ["test_brain.nii.gz", "test_brain", "test_brain.nii"]
+)
+@pytest.mark.parametrize("plugin", Plugins)
+def test_boutiques_wf_1(maskfile, plugin):
+    """ wf with one task that runs fsl.bet using BoshTask"""
+    wf = Workflow(name="wf", input_spec=["maskfile", "infile"])
+    wf.inputs.maskfile = maskfile
+    wf.inputs.infile = Infile
+
+    wf.add(
+        BoshTask(
+            name="bet",
+            zenodo="zenodo.1482743",
+            infile=wf.lzin.infile,
+            maskfile=wf.lzin.maskfile,
+        )
+    )
+
+    wf.set_output([("outfile", wf.bet.lzout.outfile)])
+
+    with Submitter(plugin=plugin) as sub:
+        wf(submitter=sub)
+
+    res = wf.result()
+    assert res.output.outfile.name == "test_brain.nii.gz"
+    assert res.output.outfile.exists()
+
+
+@no_win
+@need_bosh_docker
+@pytest.mark.parametrize(
+    "maskfile", ["test_brain.nii.gz", "test_brain", "test_brain.nii"]
+)
+@pytest.mark.parametrize("plugin", Plugins)
+def test_boutiques_wf_2(maskfile, plugin):
+    """ wf with two BoshTasks (fsl.bet and fsl.stats) and one ShellTask"""
+    wf = Workflow(name="wf", input_spec=["maskfile", "infile"])
+    wf.inputs.maskfile = maskfile
+    wf.inputs.infile = Infile
+
+    wf.add(
+        BoshTask(
+            name="bet",
+            zenodo="zenodo.1482743",
+            infile=wf.lzin.infile,
+            maskfile=wf.lzin.maskfile,
+        )
+    )
+    wf.add(
+        BoshTask(
+            name="stat",
+            zenodo="zenodo.3240521",
+            input_file=wf.bet.lzout.outfile,
+            v=True,
+        )
+    )
+    wf.add(ShellCommandTask(name="cat", executable="cat", args=wf.stat.lzout.output))
+
+    wf.set_output(
+        [
+            ("outfile_bet", wf.bet.lzout.outfile),
+            ("out_stat", wf.stat.lzout.output),
+            ("out", wf.cat.lzout.stdout),
+        ]
+    )
+
+    with Submitter(plugin=plugin) as sub:
+        wf(submitter=sub)
+
+    res = wf.result()
+    assert res.output.outfile_bet.name == "test_brain.nii.gz"
+    assert res.output.outfile_bet.exists()
+
+    assert res.output.out_stat.name == "output.txt"
+    assert res.output.out_stat.exists()
+
+    assert int(res.output.out.rstrip().split()[0]) == 11534336
+    assert float(res.output.out.rstrip().split()[1]) == 11534336.0