18180: Support for requesting preemptible instances in CWL
[arvados.git] / sdk / cwl / arvados_cwl / arvcontainer.py
1 # Copyright (C) The Arvados Authors. All rights reserved.
2 #
3 # SPDX-License-Identifier: Apache-2.0
4
5 from future import standard_library
6 standard_library.install_aliases()
7 from builtins import str
8
9 import logging
10 import json
11 import os
12 import urllib.request, urllib.parse, urllib.error
13 import time
14 import datetime
15 import ciso8601
16 import uuid
17 import math
18
19 import arvados_cwl.util
20 import ruamel.yaml as yaml
21
22 from cwltool.errors import WorkflowException
23 from cwltool.process import UnsupportedRequirement, shortname
24 from cwltool.utils import aslist, adjustFileObjs, adjustDirObjs, visit_class
25 from cwltool.job import JobBase
26
27 import arvados.collection
28
29 from .arvdocker import arv_docker_get_image
30 from . import done
31 from .runner import Runner, arvados_jobs_image, packed_workflow, trim_anonymous_location, remove_redundant_fields, make_builder
32 from .fsaccess import CollectionFetcher
33 from .pathmapper import NoFollowPathMapper, trim_listing
34 from .perf import Perf
35 from ._version import __version__
36
37 logger = logging.getLogger('arvados.cwl-runner')
38 metrics = logging.getLogger('arvados.cwl-runner.metrics')
39
class ArvadosContainer(JobBase):
    """Submit and manage a Crunch container request for executing a CWL CommandLineTool."""

    def __init__(self, runner, job_runtime,
                 builder,   # type: Builder
                 joborder,  # type: Dict[Text, Union[Dict[Text, Any], List, Text]]
                 make_path_mapper,  # type: Callable[..., PathMapper]
                 requirements,      # type: List[Dict[Text, Text]]
                 hints,     # type: List[Dict[Text, Text]]
                 name       # type: Text
    ):
        """Initialize the job and remember the runner and runtime context.

        ``runner`` is stored as ``self.arvrunner`` and ``job_runtime`` as
        ``self.job_runtime``; the remaining arguments are passed through
        unchanged to ``JobBase.__init__``.
        """
        super(ArvadosContainer, self).__init__(builder, joborder, make_path_mapper, requirements, hints, name)
        self.arvrunner = runner
        self.job_runtime = job_runtime
        self.running = False
        # Set to the container request UUID once run() has submitted it.
        self.uuid = None

    def update_pipeline_component(self, r):
        """Do nothing; the argument is ignored."""
        pass

    def _required_env(self):
        """Return the HOME and TMPDIR environment entries for this job."""
        env = {}
        env["HOME"] = self.outdir
        env["TMPDIR"] = self.tmpdir
        return env

    def _generated_file_path(self, target):
        """Return ``target`` as a path relative to the generated-files collection.

        Absolute targets lose the ``self.outdir`` prefix when they are
        inside the output directory, and otherwise only the leading
        slash.  Relative targets are returned unchanged.
        """
        if not target.startswith("/"):
            return target
        if target.startswith(self.outdir+"/"):
            return target[len(self.outdir)+1:]
        return target[1:]

    def _generated_file_mountpoint(self, target):
        """Return the absolute mount point for ``target``.

        Relative targets are joined onto ``self.outdir``.
        """
        return target if target.startswith("/") else os.path.join(self.outdir, target)

    def run(self, runtimeContext):
        """Assemble a container request for this tool invocation and submit it.

        ArvadosCommandTool subclasses from cwltool.CommandLineTool,
        which calls makeJobRunner() to get a new ArvadosContainer
        object.  The fields that define execution such as
        command_line, environment, etc are set on the
        ArvadosContainer object by CommandLineTool.job() before
        run() is called.

        The ``runtimeContext`` argument is not used: it is replaced by
        the ``job_runtime`` context given to the constructor.

        Raises WorkflowException if secret material appears on the
        command line or in the environment, or if the output TTL is
        negative.  Errors raised while submitting the request are
        logged and reported through
        ``self.output_callback({}, "permanentFail")`` instead of
        propagating.
        """

        runtimeContext = self.job_runtime

        # When a request UUID was supplied, start from the existing
        # record and update it; otherwise build a new request.
        if runtimeContext.submit_request_uuid:
            container_request = self.arvrunner.api.container_requests().get(
                uuid=runtimeContext.submit_request_uuid
            ).execute(num_retries=self.arvrunner.num_retries)
        else:
            container_request = {}

        container_request["command"] = self.command_line
        container_request["name"] = self.name
        container_request["output_path"] = self.outdir
        container_request["cwd"] = self.outdir
        container_request["priority"] = runtimeContext.priority
        container_request["state"] = "Committed"
        container_request.setdefault("properties", {})

        runtime_constraints = {}

        if runtimeContext.project_uuid:
            container_request["owner_uuid"] = runtimeContext.project_uuid

        if self.arvrunner.secret_store.has_secret(self.command_line):
            raise WorkflowException("Secret material leaked on command line, only file literals may contain secrets")

        if self.arvrunner.secret_store.has_secret(self.environment):
            raise WorkflowException("Secret material leaked in environment, only file literals may contain secrets")

        resources = self.builder.resources
        if resources is not None:
            # Resource sizes are multiplied by 2**20 before being sent.
            runtime_constraints["vcpus"] = math.ceil(resources.get("cores", 1))
            runtime_constraints["ram"] = math.ceil(resources.get("ram") * 2**20)
        else:
            # Fall back to an empty mapping so the lookups below use
            # their defaults instead of failing on None.
            resources = {}

        mounts = {
            self.outdir: {
                "kind": "tmp",
                "capacity": math.ceil(resources.get("outdirSize", 0) * 2**20)
            },
            self.tmpdir: {
                "kind": "tmp",
                "capacity": math.ceil(resources.get("tmpdirSize", 0) * 2**20)
            }
        }
        secret_mounts = {}
        scheduling_parameters = {}

        # Mount the collections holding the referenced input files.
        rf = [self.pathmapper.mapper(f) for f in self.pathmapper.referenced_files]
        rf.sort(key=lambda k: k.resolved)
        prevdir = None
        for resolved, target, tp, stg in rf:
            if not stg:
                continue
            # Skip anything below a directory that was already mounted.
            if prevdir and target.startswith(prevdir):
                continue
            if tp == "Directory":
                targetdir = target
            else:
                targetdir = os.path.dirname(target)
            sp = resolved.split("/", 1)
            pdh = sp[0][5:]   # remove "keep:"
            mounts[targetdir] = {
                "kind": "collection",
                "portable_data_hash": pdh
            }
            if pdh in self.pathmapper.pdh_to_uuid:
                mounts[targetdir]["uuid"] = self.pathmapper.pdh_to_uuid[pdh]
            if len(sp) == 2:
                if tp == "Directory":
                    path = sp[1]
                else:
                    path = os.path.dirname(sp[1])
                if path and path != "/":
                    mounts[targetdir]["path"] = path
            prevdir = targetdir + "/"

        with Perf(metrics, "generatefiles %s" % self.name):
            if self.generatefiles["listing"]:
                # Stage the generated files in a new collection, then
                # mount each entry of that collection into the container.
                vwd = arvados.collection.Collection(api_client=self.arvrunner.api,
                                                    keep_client=self.arvrunner.keep_client,
                                                    num_retries=self.arvrunner.num_retries)
                generatemapper = NoFollowPathMapper(self.generatefiles["listing"], "", "",
                                                    separateDirs=False)

                sorteditems = sorted(generatemapper.items(), key=lambda n: n[1].target)

                logger.debug("generatemapper is %s", sorteditems)

                with Perf(metrics, "createfiles %s" % self.name):
                    for _, p in sorteditems:
                        if not p.target:
                            continue

                        dst = self._generated_file_path(p.target)

                        if p.type in ("File", "Directory", "WritableFile", "WritableDirectory"):
                            if p.resolved.startswith("_:"):
                                vwd.mkdirs(dst)
                            else:
                                source, path = self.arvrunner.fs_access.get_collection(p.resolved)
                                vwd.copy(path or ".", dst, source_collection=source)
                        elif p.type == "CreateFile":
                            if self.arvrunner.secret_store.has_secret(p.resolved):
                                # Secret content goes into secret_mounts
                                # instead of being written to the collection.
                                mountpoint = self._generated_file_mountpoint(p.target)
                                secret_mounts[mountpoint] = {
                                    "kind": "text",
                                    "content": self.arvrunner.secret_store.retrieve(p.resolved)
                                }
                            else:
                                with vwd.open(dst, "w") as n:
                                    n.write(p.resolved)

                def keepemptydirs(p):
                    # Put a ".keep" file in every empty subcollection.
                    if isinstance(p, arvados.collection.RichCollectionBase):
                        if len(p) == 0:
                            p.open(".keep", "w").close()
                        else:
                            for c in p:
                                keepemptydirs(p[c])

                keepemptydirs(vwd)

                if not runtimeContext.current_container:
                    runtimeContext.current_container = arvados_cwl.util.get_current_container(self.arvrunner.api, self.arvrunner.num_retries, logger)
                info = arvados_cwl.util.get_intermediate_collection_info(self.name, runtimeContext.current_container, runtimeContext.intermediate_output_ttl)
                vwd.save_new(name=info["name"],
                             owner_uuid=runtimeContext.project_uuid,
                             ensure_unique_name=True,
                             trash_at=info["trash_at"],
                             properties=info["properties"])

                prev = None
                for _, p in sorteditems:
                    # Secrets were handled above; entries below an
                    # already-mounted target need no mount of their own.
                    if (not p.target or self.arvrunner.secret_store.has_secret(p.resolved) or
                        (prev is not None and p.target.startswith(prev))):
                        continue
                    dst = self._generated_file_path(p.target)
                    mountpoint = self._generated_file_mountpoint(p.target)
                    mounts[mountpoint] = {"kind": "collection",
                                          "portable_data_hash": vwd.portable_data_hash(),
                                          "path": dst}
                    if p.type.startswith("Writable"):
                        mounts[mountpoint]["writable"] = True
                    prev = p.target + "/"

        container_request["environment"] = {"TMPDIR": self.tmpdir, "HOME": self.outdir}
        if self.environment:
            container_request["environment"].update(self.environment)

        if self.stdin:
            # Drops the first six characters of the stdin path
            # (presumably a "/keep/" prefix -- TODO confirm).
            sp = self.stdin[6:].split("/", 1)
            mounts["stdin"] = {"kind": "collection",
                                "portable_data_hash": sp[0],
                                "path": sp[1]}

        if self.stderr:
            mounts["stderr"] = {"kind": "file",
                                "path": "%s/%s" % (self.outdir, self.stderr)}

        if self.stdout:
            mounts["stdout"] = {"kind": "file",
                                "path": "%s/%s" % (self.outdir, self.stdout)}

        (docker_req, docker_is_req) = self.get_requirement("DockerRequirement")

        container_request["container_image"] = arv_docker_get_image(self.arvrunner.api,
                                                                    docker_req,
                                                                    runtimeContext.pull_image,
                                                                    runtimeContext.project_uuid,
                                                                    runtimeContext.force_docker_pull,
                                                                    runtimeContext.tmp_outdir_prefix,
                                                                    runtimeContext.match_local_docker)

        network_req, _ = self.get_requirement("NetworkAccess")
        if network_req:
            runtime_constraints["API"] = network_req["networkAccess"]

        api_req, _ = self.get_requirement("http://arvados.org/cwl#APIRequirement")
        if api_req:
            runtime_constraints["API"] = True

        runtime_req, _ = self.get_requirement("http://arvados.org/cwl#RuntimeConstraints")
        if runtime_req:
            if "keep_cache" in runtime_req:
                runtime_constraints["keep_cache_ram"] = math.ceil(runtime_req["keep_cache"] * 2**20)
            if "outputDirType" in runtime_req:
                if runtime_req["outputDirType"] == "local_output_dir":
                    # Currently the default behavior.
                    pass
                elif runtime_req["outputDirType"] == "keep_output_dir":
                    mounts[self.outdir]= {
                        "kind": "collection",
                        "writable": True
                    }

        partition_req, _ = self.get_requirement("http://arvados.org/cwl#PartitionRequirement")
        if partition_req:
            scheduling_parameters["partitions"] = aslist(partition_req["partition"])

        intermediate_output_req, _ = self.get_requirement("http://arvados.org/cwl#IntermediateOutput")
        if intermediate_output_req:
            self.output_ttl = intermediate_output_req["outputTTL"]
        else:
            self.output_ttl = self.arvrunner.intermediate_output_ttl

        if self.output_ttl < 0:
            # Report the value that was just checked;
            # container_request["output_ttl"] is not assigned until later.
            raise WorkflowException("Invalid value %d for output_ttl, cannot be less than zero" % self.output_ttl)


        if self.arvrunner.api._rootDesc["revision"] >= "20210628":
            storage_class_req, _ = self.get_requirement("http://arvados.org/cwl#OutputStorageClass")
            if storage_class_req and storage_class_req.get("intermediateStorageClass"):
                container_request["output_storage_classes"] = aslist(storage_class_req["intermediateStorageClass"])
            else:
                container_request["output_storage_classes"] = runtimeContext.intermediate_storage_classes.strip().split(",")

        cuda_req, _ = self.get_requirement("http://commonwl.org/cwltool#CUDARequirement")
        if cuda_req:
            runtime_constraints["cuda"] = {
                "device_count": resources.get("cudaDeviceCount", 1),
                "driver_version": cuda_req["cudaVersionMin"],
                "hardware_capability": aslist(cuda_req["cudaComputeCapability"])[0]
            }

        # An explicit enable_preemptible=False overrides the
        # UsePreemptible requirement; otherwise the requirement wins
        # over an explicit enable_preemptible=True.
        if runtimeContext.enable_preemptible is False:
            scheduling_parameters["preemptible"] = False
        else:
            preemptible_req, _ = self.get_requirement("http://arvados.org/cwl#UsePreemptible")
            if preemptible_req:
                scheduling_parameters["preemptible"] = preemptible_req["usePreemptible"]
            elif runtimeContext.enable_preemptible is True:
                scheduling_parameters["preemptible"] = True
            # Otherwise leave "preemptible" out of the request.

        if self.timelimit is not None and self.timelimit > 0:
            scheduling_parameters["max_run_time"] = self.timelimit

        extra_submit_params = {}
        if runtimeContext.submit_runner_cluster:
            extra_submit_params["cluster_id"] = runtimeContext.submit_runner_cluster

        container_request["output_name"] = "Output for step %s" % (self.name)
        container_request["output_ttl"] = self.output_ttl
        container_request["mounts"] = mounts
        container_request["secret_mounts"] = secret_mounts
        container_request["runtime_constraints"] = runtime_constraints
        container_request["scheduling_parameters"] = scheduling_parameters

        # Reuse requirements are only consulted when reuse is enabled
        # in the runtime context; the Arvados-specific one is read
        # last and therefore takes precedence.
        enable_reuse = runtimeContext.enable_reuse
        if enable_reuse:
            reuse_req, _ = self.get_requirement("WorkReuse")
            if reuse_req:
                enable_reuse = reuse_req["enableReuse"]
            reuse_req, _ = self.get_requirement("http://arvados.org/cwl#ReuseRequirement")
            if reuse_req:
                enable_reuse = reuse_req["enableReuse"]
        container_request["use_existing"] = enable_reuse

        properties_req, _ = self.get_requirement("http://arvados.org/cwl#ProcessProperties")
        if properties_req:
            for pr in properties_req["processProperties"]:
                container_request["properties"][pr["propertyName"]] = self.builder.do_eval(pr["propertyValue"])

        if runtimeContext.runnerjob.startswith("arvwf:"):
            # The workflow UUID sits between the "arvwf:" prefix and "#".
            wfuuid = runtimeContext.runnerjob[6:runtimeContext.runnerjob.index("#")]
            wfrecord = self.arvrunner.api.workflows().get(uuid=wfuuid).execute(num_retries=self.arvrunner.num_retries)
            if container_request["name"] == "main":
                container_request["name"] = wfrecord["name"]
            container_request["properties"]["template_uuid"] = wfuuid

        self.output_callback = self.arvrunner.get_wrapped_callback(self.output_callback)

        try:
            if runtimeContext.submit_request_uuid:
                # Doesn't make sense for "update" and actually fails
                # (same handling as RunnerContainer.run).
                extra_submit_params.pop("cluster_id", None)
                response = self.arvrunner.api.container_requests().update(
                    uuid=runtimeContext.submit_request_uuid,
                    body=container_request,
                    **extra_submit_params
                ).execute(num_retries=self.arvrunner.num_retries)
            else:
                response = self.arvrunner.api.container_requests().create(
                    body=container_request,
                    **extra_submit_params
                ).execute(num_retries=self.arvrunner.num_retries)

            self.uuid = response["uuid"]
            self.arvrunner.process_submitted(self)

            if response["state"] == "Final":
                logger.info("%s reused container %s", self.arvrunner.label(self), response["container_uuid"])
            else:
                logger.info("%s %s state is %s", self.arvrunner.label(self), response["uuid"], response["state"])
        except Exception as e:
            logger.exception("%s error submitting container\n%s", self.arvrunner.label(self), e)
            logger.debug("Container request was %s", container_request)
            self.output_callback({}, "permanentFail")

    def done(self, record):
        """Collect the result of a finished container request.

        ``record`` is the container request record; its
        ``container_uuid``, ``log_uuid``, ``output_uuid``, ``uuid`` and
        ``modified_at`` fields are read.  The process status is derived
        from the container state and exit code, and
        ``self.output_callback(outputs, processStatus)`` is always
        called, including when collecting the outputs fails.
        """
        outputs = {}
        # Default so the callback in ``finally`` always has a status,
        # even if an unexpected error escapes the handlers below.
        processStatus = "permanentFail"
        try:
            container = self.arvrunner.api.containers().get(
                uuid=record["container_uuid"]
            ).execute(num_retries=self.arvrunner.num_retries)
            if container["state"] == "Complete":
                rcode = container["exit_code"]
                # Explicit exit code lists take priority over the
                # default "zero means success" rule.
                if self.successCodes and rcode in self.successCodes:
                    processStatus = "success"
                elif self.temporaryFailCodes and rcode in self.temporaryFailCodes:
                    processStatus = "temporaryFail"
                elif self.permanentFailCodes and rcode in self.permanentFailCodes:
                    processStatus = "permanentFail"
                elif rcode == 0:
                    processStatus = "success"
                else:
                    processStatus = "permanentFail"
            else:
                processStatus = "permanentFail"

            if processStatus == "permanentFail" and record["log_uuid"]:
                # Pass the log collection to done.logtail for error reporting.
                logc = arvados.collection.CollectionReader(record["log_uuid"],
                                                           api_client=self.arvrunner.api,
                                                           keep_client=self.arvrunner.keep_client,
                                                           num_retries=self.arvrunner.num_retries)
                label = self.arvrunner.label(self)
                done.logtail(
                    logc, logger.error,
                    "%s (%s) error log:" % (label, record["uuid"]), maxlen=40)

            if record["output_uuid"]:
                if self.arvrunner.trash_intermediate or self.arvrunner.intermediate_output_ttl:
                    # Compute the trash time to avoid requesting the collection record.
                    trash_at = ciso8601.parse_datetime_as_naive(record["modified_at"]) + datetime.timedelta(0, self.arvrunner.intermediate_output_ttl)
                    aftertime = " at %s" % trash_at.strftime("%Y-%m-%d %H:%M:%S UTC") if self.arvrunner.intermediate_output_ttl else ""
                    orpart = ", or" if self.arvrunner.trash_intermediate and self.arvrunner.intermediate_output_ttl else ""
                    oncomplete = " upon successful completion of the workflow" if self.arvrunner.trash_intermediate else ""
                    logger.info("%s Intermediate output %s (%s) will be trashed%s%s%s.",
                                self.arvrunner.label(self), record["output_uuid"], container["output"], aftertime, orpart, oncomplete)
                self.arvrunner.add_intermediate_output(record["output_uuid"])

            if container["output"]:
                outputs = done.done_outputs(self, container, "/tmp", self.outdir, "/keep")
        except WorkflowException as e:
            # Only include a stack trace if in debug mode.
            # A stack trace may obfuscate more useful output about the workflow.
            logger.error("%s unable to collect output from %s:\n%s",
                         self.arvrunner.label(self), container["output"], e, exc_info=(e if self.arvrunner.debug else False))
            processStatus = "permanentFail"
        except Exception:
            logger.exception("%s while getting output object:", self.arvrunner.label(self))
            processStatus = "permanentFail"
        finally:
            self.output_callback(outputs, processStatus)
432
433
class RunnerContainer(Runner):
    """Submit and manage a container that runs arvados-cwl-runner."""

    def arvados_job_spec(self, runtimeContext):
        """Build the container request body for running this workflow.

        The result is a dict suitable for the +body+ argument of
        container_requests().create().  Secret inputs in the job order
        are replaced in place by "$include" references to entries in
        the request's secret mounts.
        """

        adjustDirObjs(self.job_order, trim_listing)
        for cleanup in (trim_anonymous_location, remove_redundant_fields):
            visit_class(self.job_order, ("File", "Directory"), cleanup)

        # Move each secret input into its own numbered secret mount.
        secret_mounts = {}
        for param in sorted(self.job_order):
            value = self.job_order[param]
            if not self.secret_store.has_secret(value):
                continue
            mnt = "/secrets/s%d" % len(secret_mounts)
            secret_mounts[mnt] = {
                "kind": "text",
                "content": self.secret_store.retrieve(self.job_order[param])
            }
            self.job_order[param] = {"$include": mnt}

        workdir = "/var/spool/cwl"
        container_req = {
            "name": self.name,
            "output_path": workdir,
            "cwd": workdir,
            "priority": self.priority,
            "state": "Committed",
            "container_image": arvados_jobs_image(self.arvrunner, self.jobs_image),
            "mounts": {
                "/var/lib/cwl/cwl.input.json": {
                    "kind": "json",
                    "content": self.job_order
                },
                "stdout": {
                    "kind": "file",
                    "path": "/var/spool/cwl/cwl.output.json"
                },
                workdir: {
                    "kind": "collection",
                    "writable": True
                }
            },
            "secret_mounts": secret_mounts,
            "runtime_constraints": {
                "vcpus": math.ceil(self.submit_runner_cores),
                "ram": 1024*1024 * (math.ceil(self.submit_runner_ram) + math.ceil(self.collection_cache_size)),
                "API": True
            },
            # Never reuse the runner container - see #15497.
            "use_existing": False,
            "properties": {}
        }

        tool_id = self.embedded_tool.tool.get("id", "")
        if tool_id.startswith("keep:"):
            # Mount the collection named by the id and run the
            # workflow file from inside that mount.
            collection_ref, _, workflowname = tool_id.partition("/")
            workflowcollection = collection_ref[5:]
            workflowpath = "/var/lib/cwl/workflow/%s" % workflowname
            container_req["mounts"]["/var/lib/cwl/workflow"] = {
                "kind": "collection",
                "portable_data_hash": "%s" % workflowcollection
            }
        else:
            # Otherwise pass the packed workflow as a JSON mount.
            packed = packed_workflow(self.arvrunner, self.embedded_tool, self.merged_map)
            workflowpath = "/var/lib/cwl/workflow.json#main"
            container_req["mounts"]["/var/lib/cwl/workflow.json"] = {
                "kind": "json",
                "content": packed
            }
            if self.embedded_tool.tool.get("id", "").startswith("arvwf:"):
                container_req["properties"]["template_uuid"] = self.embedded_tool.tool["id"][6:33]

        properties_req, _ = self.embedded_tool.get_requirement("http://arvados.org/cwl#ProcessProperties")
        if properties_req:
            builder = make_builder(self.job_order, self.embedded_tool.hints, self.embedded_tool.requirements, runtimeContext, self.embedded_tool.metadata)
            for pr in properties_req["processProperties"]:
                evaluated = builder.do_eval(pr["propertyValue"])
                container_req["properties"][pr["propertyName"]] = evaluated

        # Options always passed to the runner inside the container:
        # --local means execute the workflow instead of submitting a container request
        # --api=containers means use the containers API
        # --no-log-timestamps means don't add timestamps (the logging infrastructure does this)
        # --disable-validate because we already validated so don't need to do it again
        # --eval-timeout is the timeout for javascript invocation
        # --thread-count passes along the runner's thread_count setting
        # --enable/disable-reuse sets desired job reuse
        # --collection-cache-size sets aside memory to store collections
        if self.enable_reuse:
            reuse_flag = "--enable-reuse"
        else:
            reuse_flag = "--disable-reuse"

        command = [
            "arvados-cwl-runner",
            "--local",
            "--api=containers",
            "--no-log-timestamps",
            "--disable-validate",
            "--disable-color",
            "--eval-timeout=%s" % self.arvrunner.eval_timeout,
            "--thread-count=%s" % self.arvrunner.thread_count,
            reuse_flag,
            "--collection-cache-size=%s" % self.collection_cache_size,
        ]

        # Optional flags, appended only when the matching setting is present.
        if self.output_name:
            command.append("--output-name=" + self.output_name)
            container_req["output_name"] = self.output_name

        if self.output_tags:
            command.append("--output-tags=" + self.output_tags)

        if runtimeContext.debug:
            command.append("--debug")

        storage_classes = runtimeContext.storage_classes
        if storage_classes != "default" and storage_classes:
            command.append("--storage-classes=" + storage_classes)

        intermediate_classes = runtimeContext.intermediate_storage_classes
        if intermediate_classes != "default" and intermediate_classes:
            command.append("--intermediate-storage-classes=" + intermediate_classes)

        if self.on_error:
            command.append("--on-error=" + self.on_error)

        if self.intermediate_output_ttl:
            command.append("--intermediate-output-ttl=%d" % self.intermediate_output_ttl)

        if self.arvrunner.trash_intermediate:
            command.append("--trash-intermediate")

        if self.arvrunner.project_uuid:
            command.append("--project-uuid="+self.arvrunner.project_uuid)

        if self.enable_dev:
            command.append("--enable-dev")

        # Any value other than exactly True or False adds no flag.
        if runtimeContext.enable_preemptible is True:
            command.append("--enable-preemptible")
        elif runtimeContext.enable_preemptible is False:
            command.append("--disable-preemptible")

        command += [workflowpath, "/var/lib/cwl/cwl.input.json"]

        container_req["command"] = command

        return container_req


    def run(self, runtimeContext):
        """Submit the runner container request and log where to monitor it.

        Updates the existing request when
        ``runtimeContext.submit_request_uuid`` is set, and creates a new
        one otherwise.
        """
        runtimeContext.keepprefix = "keep:"
        job_spec = self.arvados_job_spec(runtimeContext)
        if self.arvrunner.project_uuid:
            job_spec["owner_uuid"] = self.arvrunner.project_uuid

        updating = runtimeContext.submit_request_uuid

        # cluster_id doesn't make sense for "update" and actually
        # fails, so it is only sent when creating a request.
        extra_submit_params = {}
        if runtimeContext.submit_runner_cluster and not updating:
            extra_submit_params["cluster_id"] = runtimeContext.submit_runner_cluster

        requests = self.arvrunner.api.container_requests()
        if updating:
            call = requests.update(
                uuid=runtimeContext.submit_request_uuid,
                body=job_spec,
                **extra_submit_params
            )
        else:
            call = requests.create(
                body=job_spec,
                **extra_submit_params
            )
        response = call.execute(num_retries=self.arvrunner.num_retries)

        self.uuid = response["uuid"]
        self.arvrunner.process_submitted(self)

        logger.info("%s submitted container_request %s", self.arvrunner.label(self), response["uuid"])

        def external_url(service):
            return self.arvrunner.api.config()["Services"][service]["ExternalURL"]

        workbench1 = external_url("Workbench1")
        workbench2 = external_url("Workbench2")

        # A configured Workbench2 URL is preferred over Workbench1.
        if workbench2:
            url = "{}processes/{}".format(workbench2, response["uuid"])
        elif workbench1:
            url = "{}container_requests/{}".format(workbench1, response["uuid"])
        else:
            url = ""

        if url:
            logger.info("Monitor workflow progress at %s", url)


    def done(self, record):
        """Fetch the finished runner container and pass it to Runner.done.

        The record's ``log_uuid`` is stored on the container as
        ``log``.  If the container cannot be fetched, the failure is
        logged and reported as "permanentFail" through the runner's
        output callback.
        """
        try:
            lookup = self.arvrunner.api.containers().get(
                uuid=record["container_uuid"]
            )
            container = lookup.execute(num_retries=self.arvrunner.num_retries)
            container["log"] = record["log_uuid"]
        except Exception:
            logger.exception("%s while getting runner container", self.arvrunner.label(self))
            self.arvrunner.output_callback({}, "permanentFail")
            return

        super(RunnerContainer, self).done(container)