#
# SPDX-License-Identifier: Apache-2.0

"""Arvados-specific wrappers around cwltool's CommandLineTool and ExpressionTool.

Also provides the helpers that resolve and validate the
``http://arvados.org/cwl#ClusterTarget`` hint/requirement.
"""

from cwltool.command_line_tool import CommandLineTool, ExpressionTool
from .arvcontainer import ArvadosContainer
from .pathmapper import ArvPathMapper
from .runner import make_builder
from functools import partial
from schema_salad.sourceline import SourceLine
from cwltool.errors import WorkflowException


def validate_cluster_target(arvrunner, runtimeContext):
    """Check that the requested submit cluster is one this API server knows.

    Does nothing when ``runtimeContext.submit_runner_cluster`` is falsy.

    Raises:
        WorkflowException: if the cluster id is neither a key of
            ``arvrunner.api._rootDesc["remoteHosts"]`` nor equal to
            ``arvrunner.api._rootDesc["uuidPrefix"]``.
    """
    cluster_id = runtimeContext.submit_runner_cluster
    if not cluster_id:
        return

    root_desc = arvrunner.api._rootDesc
    remote_hosts = root_desc["remoteHosts"]
    if cluster_id not in remote_hosts and cluster_id != root_desc["uuidPrefix"]:
        raise WorkflowException(
            "Unknown or invalid cluster id '%s' known remote clusters are %s"
            % (cluster_id, ", ".join(remote_hosts.keys())))


def set_cluster_target(tool, arvrunner, builder, runtimeContext):
    """Apply a ClusterTarget hint/requirement of ``tool`` to the runtime context.

    ``tool["hints"]`` is scanned first, then ``tool["requirements"]``; the
    last matching entry wins, so a requirement overrides a hint.

    Returns:
        ``runtimeContext`` itself (unmodified) when the tool carries no
        ClusterTarget; otherwise a copy whose ``submit_runner_cluster`` and
        ``project_uuid`` are replaced by the evaluated ``cluster_id`` /
        ``project_uuid`` fields when those evaluate to a truthy value.

    Raises:
        WorkflowException: from ``validate_cluster_target`` when the
            resulting cluster id is unknown.
    """
    cluster_target_req = None
    for field in ("hints", "requirements"):
        if field not in tool:
            continue
        for item in tool[field]:
            if item["class"] == "http://arvados.org/cwl#ClusterTarget":
                cluster_target_req = item

    if cluster_target_req is None:
        return runtimeContext

    # NOTE(review): SourceLine presumably decorates a WorkflowException raised
    # in this block with the location of the ClusterTarget entry -- confirm
    # against schema_salad.
    with SourceLine(cluster_target_req, None, WorkflowException, runtimeContext.debug):
        # Work on a copy so the caller's context is not altered.
        runtimeContext = runtimeContext.copy()
        runtimeContext.submit_runner_cluster = (
            builder.do_eval(cluster_target_req.get("cluster_id"))
            or runtimeContext.submit_runner_cluster)
        runtimeContext.project_uuid = (
            builder.do_eval(cluster_target_req.get("project_uuid"))
            or runtimeContext.project_uuid)
        validate_cluster_target(arvrunner, runtimeContext)

    return runtimeContext


class ArvadosCommandTool(CommandLineTool):
    """Wrap cwltool CommandLineTool to override selected methods."""

    def __init__(self, arvrunner, toolpath_object, loadingContext):
        """Initialise the base tool and remember the Arvados runner."""
        super(ArvadosCommandTool, self).__init__(toolpath_object, loadingContext)
        self.arvrunner = arvrunner

    def make_job_runner(self, runtimeContext):
        """Return a factory for the job runner matching ``work_api``.

        For ``"containers"`` the result is ``ArvadosContainer`` partially
        applied to the runner and ``runtimeContext``.

        Raises:
            Exception: for any other ``work_api`` value.
        """
        if runtimeContext.work_api == "containers":
            return partial(ArvadosContainer, self.arvrunner, runtimeContext)
        # Interpolate with %: passing the value as a second argument to
        # Exception() would leave the "%s" placeholder unformatted.
        raise Exception("Unsupported work_api %s" % runtimeContext.work_api)

    def make_path_mapper(self, reffiles, stagedir, runtimeContext, separateDirs):
        """Return an ArvPathMapper rooted at ``/keep`` for the containers API.

        ``stagedir`` and ``separateDirs`` are accepted but not used here.
        Returns None (implicitly) when ``work_api`` is not ``"containers"``.
        """
        if runtimeContext.work_api == "containers":
            return ArvPathMapper(self.arvrunner,
                                 reffiles + runtimeContext.extra_reffiles,
                                 runtimeContext.basedir,
                                 "/keep/%s",
                                 "/keep/%s/%s")

    def job(self, joborder, output_callback, runtimeContext):
        """Resolve the cluster target and output directory, then delegate.

        NOTE: when the tool has no ClusterTarget, ``set_cluster_target``
        returns the caller's ``runtimeContext`` object itself, so the
        ``outdir`` / ``docker_outdir`` assignments below modify it in place.
        """
        builder = make_builder(joborder, self.hints, self.requirements, runtimeContext)
        runtimeContext = set_cluster_target(self.tool, self.arvrunner, builder, runtimeContext)

        if runtimeContext.work_api == "containers":
            dockerReq, _ = self.get_requirement("DockerRequirement")
            # Use the DockerRequirement's output directory when one is given,
            # otherwise fall back to /var/spool/cwl.
            outdir = (dockerReq.get("dockerOutputDirectory") if dockerReq else None) or "/var/spool/cwl"
            runtimeContext.outdir = outdir
            runtimeContext.docker_outdir = outdir
        return super(ArvadosCommandTool, self).job(joborder, output_callback, runtimeContext)


class ArvadosExpressionTool(ExpressionTool):
    """Wrap cwltool ExpressionTool so output callbacks go through the runner."""

    def __init__(self, arvrunner, toolpath_object, loadingContext):
        """Initialise the base tool and remember the Arvados runner."""
        super(ArvadosExpressionTool, self).__init__(toolpath_object, loadingContext)
        self.arvrunner = arvrunner

    def job(self,
            job_order,         # type: Mapping[Text, Text]
            output_callback,   # type: Callable[[Any, Any], Any]
            runtimeContext     # type: RuntimeContext
           ):
        """Delegate to ExpressionTool.job with the callback wrapped by the runner."""
        wrapped_callback = self.arvrunner.get_wrapped_callback(output_callback)
        return super(ArvadosExpressionTool, self).job(job_order, wrapped_callback, runtimeContext)