X-Git-Url: https://git.arvados.org/arvados.git/blobdiff_plain/3e443d57aaecd34e63a8d861c7075ab7b0f61174..c51634cad3c68d0a8400f1b1c47da9eef5307e06:/sdk/python/arvados/collection.py diff --git a/sdk/python/arvados/collection.py b/sdk/python/arvados/collection.py index 400a88c5f2..496136ebe3 100644 --- a/sdk/python/arvados/collection.py +++ b/sdk/python/arvados/collection.py @@ -92,13 +92,16 @@ def normalize(collection): class CollectionReader(object): - def __init__(self, manifest_locator_or_text, api_client=None): + def __init__(self, manifest_locator_or_text, api_client=None, keep_client=None): self._api_client = api_client - self._keep_client = None + self._keep_client = keep_client if re.match(r'[a-f0-9]{32}(\+\d+)?(\+\S+)*$', manifest_locator_or_text): self._manifest_locator = manifest_locator_or_text self._manifest_text = None - elif re.match(r'(\S+)( [a-f0-9]{32}(\+\d+)(\+\S+)*)+( \d+:\d+:\S+)+\n', manifest_locator_or_text): + elif re.match(r'[a-z0-9]{5}-[a-z0-9]{5}-[a-z0-9]{15}$', manifest_locator_or_text): + self._manifest_locator = manifest_locator_or_text + self._manifest_text = None + elif re.match(r'((\S+)( +[a-f0-9]{32}(\+\d+)(\+\S+)*)+( +\d+:\d+:\S+)+$)+', manifest_locator_or_text, re.MULTILINE): self._manifest_text = manifest_locator_or_text self._manifest_locator = None else: @@ -132,6 +135,9 @@ class CollectionReader(object): uuid=self._manifest_locator).execute() self._manifest_text = c['manifest_text'] except Exception as e: + if not util.portable_data_hash_pattern.match( + self._manifest_locator): + raise _logger.warning("API lookup failed for collection %s (%s: %s)", self._manifest_locator, type(e), str(e)) if self._keep_client is None: @@ -147,7 +153,7 @@ class CollectionReader(object): # now regenerate the manifest text based on the normalized stream #print "normalizing", self._manifest_text - self._manifest_text = ''.join([StreamReader(stream).manifest_text() for stream in self._streams]) + self._manifest_text = ''.join([StreamReader(stream, keep=self._keep_client).manifest_text() for stream in self._streams]) #print "result", self._manifest_text @@ -155,7 +161,7 @@ class CollectionReader(object): self._populate() resp = [] for s in self._streams: - resp.append(StreamReader(s)) + resp.append(StreamReader(s, keep=self._keep_client)) return resp def all_files(self): @@ -166,7 +172,7 @@ class CollectionReader(object): def manifest_text(self, strip=False): self._populate() if strip: - m = ''.join([StreamReader(stream).manifest_text(strip=True) for stream in self._streams]) + m = ''.join([StreamReader(stream, keep=self._keep_client).manifest_text(strip=True) for stream in self._streams]) return m else: return self._manifest_text