X-Git-Url: https://git.arvados.org/arvados.git/blobdiff_plain/da51b9328abab2df757ed13eadc7c3557315094b..71c66323a0ac9ce0cacf3ed3585a07562553096d:/services/api/app/models/collection.rb diff --git a/services/api/app/models/collection.rb b/services/api/app/models/collection.rb index 03e5e4ef44..24e4ccc0ab 100644 --- a/services/api/app/models/collection.rb +++ b/services/api/app/models/collection.rb @@ -1,5 +1,5 @@ class Collection < ArvadosModel - include AssignUuid + include HasUuid include KindAndEtag include CommonApiTemplate @@ -8,6 +8,10 @@ class Collection < ArvadosModel t.add :files end + api_accessible :with_data, extend: :user do |t| + t.add :manifest_text + end + def redundancy_status if redundancy_confirmed_as.nil? 'unconfirmed' @@ -33,14 +37,14 @@ class Collection < ArvadosModel self.uuid.gsub! /$/, '+' + self.manifest_text.length.to_s true else - errors.add :uuid, 'uuid does not match checksum of manifest_text' + errors.add :uuid, 'does not match checksum of manifest_text' false end elsif self.manifest_text - errors.add :uuid, 'checksum for manifest_text not supplied in uuid' + errors.add :uuid, 'not supplied (must match checksum of manifest_text)' false else - errors.add :manifest_text, 'manifest_text not supplied' + errors.add :manifest_text, 'not supplied' false end end @@ -61,8 +65,19 @@ class Collection < ArvadosModel @files = [] return end + + #normalized_manifest = "" + #IO.popen(['arv-normalize'], 'w+b') do |io| + # io.write manifest_text + # io.close_write + # while buf = io.read(2**20) + # normalized_manifest += buf + # end + #end + @data_size = 0 - @files = [] + tmp = {} + manifest_text.split("\n").each do |stream| toks = stream.split(" ") @@ -94,10 +109,91 @@ class Collection < ArvadosModel else $1.to_i(8).chr end end - @files << [stream, filename, re[2].to_i] + fn = stream + '/' + filename + i = re[2].to_i + if tmp[fn] + tmp[fn] += i + else + tmp[fn] = i + end end end end end + + @files = [] + tmp.each do |k, v| + re = k.match(/^(.+)\/(.+)/) + @files << [re[1], re[2], v] + end + end + + def self.uuid_like_pattern + "________________________________+%" + end + + def self.normalize_uuid uuid + hash_part = nil + size_part = nil + uuid.split('+').each do |token| + if token.match /^[0-9a-f]{32,}$/ + raise "uuid #{uuid} has multiple hash parts" if hash_part + hash_part = token + elsif token.match /^\d+$/ + raise "uuid #{uuid} has multiple size parts" if size_part + size_part = token + end + end + raise "uuid #{uuid} has no hash part" if !hash_part + [hash_part, size_part].compact.join '+' + end + + def self.uuids_for_docker_image(search_term, search_tag=nil, readers=nil) + readers ||= [Thread.current[:user]] + base_search = Link. + readable_by(*readers). + readable_by(*readers, table_name: "collections"). + joins("JOIN collections ON links.head_uuid = collections.uuid"). + order("links.created_at DESC") + + # If the search term is a Collection locator with an associated + # Docker image hash link, return that Collection. + coll_matches = base_search. + where(link_class: "docker_image_hash", collections: {uuid: search_term}) + if match = coll_matches.first + return [match.head_uuid] + end + + # Find Collections with matching Docker image repository+tag pairs. + matches = base_search. + where(link_class: "docker_image_repo+tag", + name: "#{search_term}:#{search_tag || 'latest'}") + + # If that didn't work, find Collections with matching Docker image hashes. + if matches.empty? + matches = base_search. + where("link_class = ? and name LIKE ?", + "docker_image_hash", "#{search_term}%") + end + + # Generate an order key for each result. We want to order the results + # so that anything with an image timestamp is considered more recent than + # anything without; then we use the link's created_at as a tiebreaker. + uuid_timestamps = {} + matches.find_each do |link| + uuid_timestamps[link.head_uuid] = + [(-link.properties["image_timestamp"].to_datetime.to_i rescue 0), + -link.created_at.to_i] + end + uuid_timestamps.keys.sort_by { |uuid| uuid_timestamps[uuid] } + end + + def self.for_latest_docker_image(search_term, search_tag=nil, readers=nil) + image_uuid = uuids_for_docker_image(search_term, search_tag, readers).last + if image_uuid.nil? + nil + else + find_by_uuid(image_uuid) + end end end