X-Git-Url: https://git.arvados.org/arvados.git/blobdiff_plain/adc0f36eeab40f4b8e0603247392b3c804d7272a..09cbdc3074b3f1e69c9c537875146f6da0a6ed8f:/sdk/cwl/arvados_cwl/pathmapper.py diff --git a/sdk/cwl/arvados_cwl/pathmapper.py b/sdk/cwl/arvados_cwl/pathmapper.py index a5dd5ccf39..e2e287bf1d 100644 --- a/sdk/cwl/arvados_cwl/pathmapper.py +++ b/sdk/cwl/arvados_cwl/pathmapper.py @@ -105,9 +105,15 @@ class ArvPathMapper(PathMapper): raise WorkflowException("Directory literal '%s' is missing `listing`" % src) elif src.startswith("http:") or src.startswith("https:"): try: - keepref = http_to_keep(self.arvrunner.api, self.arvrunner.project_uuid, src) - logger.info("%s is %s", src, keepref) - self._pathmap[src] = MapperEnt(keepref, keepref, srcobj["class"], True) + if self.arvrunner.defer_downloads: + # passthrough, we'll download it later. + self._pathmap[src] = MapperEnt(src, src, srcobj["class"], True) + else: + keepref = http_to_keep(self.arvrunner.api, self.arvrunner.project_uuid, src, + varying_url_params=self.arvrunner.toplevel_runtimeContext.varying_url_params, + prefer_cached_downloads=self.arvrunner.toplevel_runtimeContext.prefer_cached_downloads) + logger.info("%s is %s", src, keepref) + self._pathmap[src] = MapperEnt(keepref, keepref, srcobj["class"], True) except Exception as e: logger.warning(str(e)) else: @@ -156,16 +162,26 @@ class ArvPathMapper(PathMapper): if loc.startswith("_:"): return True - if not prefix: - i = loc.rfind("/") - if i > -1: - prefix = loc[:i+1] - suffix = urllib.parse.quote(urllib.parse.unquote(loc[i+1:]), "/+@") - else: - prefix = loc+"/" - suffix = "" + if self.arvrunner.defer_downloads and (loc.startswith("http:") or loc.startswith("https:")): + return False + + i = loc.rfind("/") + if i > -1: + loc_prefix = loc[:i+1] + if not prefix: + prefix = loc_prefix + # quote/unquote to ensure consistent quoting + suffix = urllib.parse.quote(urllib.parse.unquote(loc[i+1:]), "/+@") + else: + # no '/' found + loc_prefix = loc+"/" + prefix = loc+"/" + suffix = "" + + if prefix != loc_prefix: + return True - if prefix+suffix != prefix+urllib.parse.quote(srcobj["basename"], "/+@"): + if "basename" in srcobj and suffix != urllib.parse.quote(srcobj["basename"], "/+@"): return True if srcobj["class"] == "File" and loc not in self._pathmap: @@ -174,7 +190,7 @@ class ArvPathMapper(PathMapper): if self.needs_new_collection(s, prefix): return True if srcobj.get("listing"): - prefix = "%s%s/" % (prefix, srcobj["basename"]) + prefix = "%s%s/" % (prefix, urllib.parse.quote(srcobj.get("basename", suffix), "/+@")) for l in srcobj["listing"]: if self.needs_new_collection(l, prefix): return True