X-Git-Url: https://git.arvados.org/arvados.git/blobdiff_plain/970835342e02cb7a97f228f67602b7f847ab6875..5d00ecb0932f86e4d2aced3d9258b96522ef38bd:/sdk/cwl/arvados_cwl/crunch_script.py diff --git a/sdk/cwl/arvados_cwl/crunch_script.py b/sdk/cwl/arvados_cwl/crunch_script.py index 4b1b42843b..65ef50826e 100644 --- a/sdk/cwl/arvados_cwl/crunch_script.py +++ b/sdk/cwl/arvados_cwl/crunch_script.py @@ -19,10 +19,12 @@ import re import functools from arvados.api import OrderedJsonModel -from cwltool.process import shortname, adjustFileObjs, adjustDirObjs, getListing, normalizeFilesDirs +from cwltool.process import shortname, adjustFileObjs, adjustDirObjs, normalizeFilesDirs from cwltool.load_tool import load_tool from cwltool.errors import WorkflowException +from .fsaccess import CollectionFetcher, CollectionFsAccess + logger = logging.getLogger('arvados.cwl-runner') def run(): @@ -50,7 +52,8 @@ def run(): return v def keeppathObj(v): - v["location"] = keeppath(v["location"]) + if "location" in v: + v["location"] = keeppath(v["location"]) for k,v in job_order_object.items(): if isinstance(v, basestring) and arvados.util.keep_locator_pattern.match(v): @@ -62,11 +65,11 @@ def run(): adjustFileObjs(job_order_object, keeppathObj) adjustDirObjs(job_order_object, keeppathObj) normalizeFilesDirs(job_order_object) - adjustDirObjs(job_order_object, functools.partial(getListing, arvados_cwl.fsaccess.CollectionFsAccess("", api_client=api))) output_name = None output_tags = None enable_reuse = True + on_error = "continue" if "arv:output_name" in job_order_object: output_name = job_order_object["arv:output_name"] del job_order_object["arv:output_name"] @@ -79,14 +82,26 @@ def run(): enable_reuse = job_order_object["arv:enable_reuse"] del job_order_object["arv:enable_reuse"] + if "arv:on_error" in job_order_object: + on_error = job_order_object["arv:on_error"] + del job_order_object["arv:on_error"] + runner = arvados_cwl.ArvCwlRunner(api_client=arvados.api('v1', model=OrderedJsonModel()), output_name=output_name, output_tags=output_tags) - t = load_tool(toolpath, runner.arv_make_tool) + make_fs_access = functools.partial(CollectionFsAccess, + collection_cache=runner.collection_cache) + + t = load_tool(toolpath, runner.arv_make_tool, + fetcher_constructor=functools.partial(CollectionFetcher, + api_client=runner.api, + fs_access=make_fs_access(""), + num_retries=runner.num_retries)) args = argparse.Namespace() args.project_uuid = arvados.current_job()["owner_uuid"] args.enable_reuse = enable_reuse + args.on_error = on_error args.submit = False args.debug = False args.quiet = False @@ -94,7 +109,9 @@ def run(): args.basedir = os.getcwd() args.name = None args.cwl_runner_job={"uuid": arvados.current_job()["uuid"], "state": arvados.current_job()["state"]} - outputObj = runner.arv_executor(t, job_order_object, **vars(args)) + args.make_fs_access = make_fs_access + + runner.arv_executor(t, job_order_object, **vars(args)) except Exception as e: if isinstance(e, WorkflowException): logging.info("Workflow error %s", e)