X-Git-Url: https://git.arvados.org/arvados.git/blobdiff_plain/4c8468e142d92a4dd063bde9ea1337b2161999e9..a017e1f5ac7ad49a29e302275d0f0f83754941ea:/apps/workbench/app/helpers/provenance_helper.rb diff --git a/apps/workbench/app/helpers/provenance_helper.rb b/apps/workbench/app/helpers/provenance_helper.rb index dbc7dbb976..cef5cc7ee8 100644 --- a/apps/workbench/app/helpers/provenance_helper.rb +++ b/apps/workbench/app/helpers/provenance_helper.rb @@ -1,209 +1,387 @@ +# Copyright (C) The Arvados Authors. All rights reserved. +# +# SPDX-License-Identifier: AGPL-3.0 + module ProvenanceHelper - def self.describe_node(pdata, uuid) - rsc = ArvadosBase::resource_class_for_uuid uuid.to_s - if rsc - href = "/#{rsc.to_s.underscore.pluralize rsc}/#{uuid}" - - #"\"#{uuid}\" [label=\"#{rsc}\\n#{uuid}\",href=\"#{href}\"];\n" - if rsc == Collection - if pdata[uuid] - #puts pdata[uuid] - if pdata[uuid][:name] - return "\"#{uuid}\" [label=\"#{pdata[uuid][:name]}\",href=\"#{href}\",shape=oval];\n" - else - files = nil - if pdata[uuid].respond_to? :files - files = pdata[uuid].files - elsif pdata[uuid][:files] - files = pdata[uuid][:files] - end - - if files - i = 0 - label = "" - while i < 3 and i < files.length - label += "\\n" unless label == "" - label += files[i][1] - i += 1 - end - if i < files.length - label += "\\n⋮" - end - return "\"#{uuid}\" [label=\"#{label}\",href=\"#{href}\",shape=oval];\n" - end - end - end - return "\"#{uuid}\" [label=\"#{rsc}\",href=\"#{href}\"];\n" - end - end - return "" - end - def self.job_uuid(job) - # "#{job[:script]}\\n#{job[:script_version]}" - "#{job[:script]}" - end + class GenerateGraph + def initialize(pdata, opts) + @pdata = pdata + @opts = opts + @visited = {} + @jobs = {} + @node_extra = {} + end - def self.collection_uuid(uuid) - m = /([a-f0-9]{32}(\+[0-9]+)?)(\+.*)?/.match(uuid.to_s) - if m - m[1] - else - nil + def self.collection_uuid(uuid) + Keep::Locator.parse(uuid).andand.strip_hints.andand.to_s end - end - def self.edge(tail, head, extra, opts) - if opts[:direction] == :bottom_up - gr = "\"#{tail}\" -> \"#{head}\"" - else - gr = "\"#{head}\" -> \"#{tail}\"" + def url_for u + p = { :host => @opts[:request].host, + :port => @opts[:request].port, + :protocol => @opts[:request].protocol } + p.merge! u + Rails.application.routes.url_helpers.url_for (p) end - if extra.length > 0 - gr += "[" - extra.each do |k, v| - gr += "#{k}=\"#{v}\"," - end - gr += "]" + + def determine_fillcolor(n) + fillcolor = %w(666666 669966 666699 666666 996666)[n || 0] || '666666' + "style=\"filled\",color=\"#ffffff\",fillcolor=\"##{fillcolor}\",fontcolor=\"#ffffff\"" end - gr += ";\n" - gr - end - def self.script_param_edges(pdata, visited, job, prefix, sp, opts) - gr = "" - if sp and not sp.empty? - case sp - when Hash - sp.each do |k, v| - if prefix.size > 0 - k = prefix + "::" + k.to_s - end - gr += ProvenanceHelper::script_param_edges(pdata, visited, job, k.to_s, v, opts) - end - when Array - i = 0 - node = "" - sp.each do |v| - if collection_uuid(v) - gr += ProvenanceHelper::script_param_edges(pdata, visited, job, "#{prefix}[#{i}]", v, opts) - else - node += "', '" unless node == "" - node = "['" if node == "" - node += "#{v}" - end - i += 1 + def describe_node(uuid, describe_opts={}) + bgcolor = determine_fillcolor (describe_opts[:pip] || @opts[:pips].andand[uuid]) + + rsc = ArvadosBase::resource_class_for_uuid uuid + + if GenerateGraph::collection_uuid(uuid) || rsc == Collection + if Collection.is_empty_blob_locator? uuid.to_s + # special case + return "\"#{uuid}\" [label=\"(empty collection)\"];\n" end - unless node == "" - node += "']" - #puts node - #id = "#{job[:uuid]}_#{prefix}" - gr += "\"#{node}\" [label=\"#{node}\"];\n" - gr += edge(job_uuid(job), node, {:label => prefix}, opts) + + if describe_opts[:col_uuid] + href = url_for ({:controller => Collection.to_s.tableize, + :action => :show, + :id => describe_opts[:col_uuid].to_s }) + else + href = url_for ({:controller => Collection.to_s.tableize, + :action => :show, + :id => uuid.to_s }) end + + return "\"#{uuid}\" [label=\"#{encode_quotes(describe_opts[:label] || (@pdata[uuid] and @pdata[uuid][:name]) || uuid)}\",shape=box,href=\"#{href}\",#{bgcolor}];\n" else - m = collection_uuid(sp) - if m - gr += edge(job_uuid(job), m, {:label => prefix}, opts) - gr += ProvenanceHelper::generate_provenance_edges(pdata, visited, m, opts) - elsif opts[:all_script_parameters] - #id = "#{job[:uuid]}_#{prefix}" - gr += "\"#{sp}\" [label=\"#{sp}\"];\n" - gr += edge(job_uuid(job), sp, {:label => prefix}, opts) + href = "" + if describe_opts[:href] + href = ",href=\"#{url_for ({:controller => describe_opts[:href][:controller], + :action => :show, + :id => describe_opts[:href][:id] })}\"" end + return "\"#{uuid}\" [label=\"#{encode_quotes(describe_opts[:label] || uuid)}\",#{bgcolor},shape=#{describe_opts[:shape] || 'box'}#{href}];\n" end end - gr - end - def self.generate_provenance_edges(pdata, visited, uuid, opts) - gr = "" - m = ProvenanceHelper::collection_uuid(uuid) - uuid = m if m + def job_uuid(job) + d = Digest::MD5.hexdigest(job[:script_parameters].to_json) + if @opts[:combine_jobs] == :script_only + uuid = "#{job[:script]}_#{d}" + elsif @opts[:combine_jobs] == :script_and_version + uuid = "#{job[:script]}_#{job[:script_version]}_#{d}" + else + uuid = "#{job[:uuid]}" + end + + @jobs[uuid] = [] unless @jobs[uuid] + @jobs[uuid] << job unless @jobs[uuid].include? job - uuid = uuid.intern if uuid + uuid + end - if (not uuid) or uuid.empty? or visited[uuid] + def edge(tail, head, extra) + if @opts[:direction] == :bottom_up + gr = "\"#{encode_quotes head}\" -> \"#{encode_quotes tail}\"" + else + gr = "\"#{encode_quotes tail}\" -> \"#{encode_quotes head}\"" + end - #puts "already visited #{uuid}" - return "" + if extra.length > 0 + gr += " [" + extra.each do |k, v| + gr += "#{k}=\"#{encode_quotes v}\"," + end + gr += "]" + end + gr += ";\n" + gr + end + + def script_param_edges(uuid, sp) + gr = "" + + sp.each do |k, v| + if @opts[:all_script_parameters] + if v.is_a? Array or v.is_a? Hash + encv = JSON.pretty_generate(v).gsub("\n", "\\l") + "\\l" + else + encv = v.to_json + end + gr += "\"#{encode_quotes encv}\" [shape=box];\n" + gr += edge(encv, uuid, {:label => k}) + end + end + gr end - if not pdata[uuid] then - return ProvenanceHelper::describe_node(pdata, uuid) - else - visited[uuid] = true + def job_edges job, edge_opts={} + uuid = job_uuid(job) + gr = "" + + ProvenanceHelper::find_collections job[:script_parameters] do |collection_hash, collection_uuid, key| + if collection_uuid + gr += describe_node(collection_uuid) + gr += edge(collection_uuid, uuid, {:label => key}) + else + gr += describe_node(collection_hash) + gr += edge(collection_hash, uuid, {:label => key}) + end + end + + if job[:docker_image_locator] and !@opts[:no_docker] + gr += describe_node(job[:docker_image_locator], {label: (job[:runtime_constraints].andand[:docker_image] || job[:docker_image_locator])}) + gr += edge(job[:docker_image_locator], uuid, {label: "docker_image"}) + end + + if @opts[:script_version_nodes] + gr += describe_node(job[:script_version], {:label => "git:#{job[:script_version]}"}) + gr += edge(job[:script_version], uuid, {:label => "script_version"}) + end + + if job[:output] and !edge_opts[:no_output] + gr += describe_node(job[:output]) + gr += edge(uuid, job[:output], {label: "output" }) + end + + if job[:log] and !edge_opts[:no_log] + gr += describe_node(job[:log]) + gr += edge(uuid, job[:log], {label: "log"}) + end + + gr end - #puts "visiting #{uuid}" + def cr_edges cont, edge_opts={} + uuid = cont[:uuid] + gr = "" - if m - # uuid is a collection - gr += ProvenanceHelper::describe_node(pdata, uuid) + gr += describe_node(cont[:uuid], {href: {controller: 'container_requests', + id: cont[:uuid]}, + shape: 'oval', + label: cont[:name]}) - pdata.each do |k, job| - if job[:output] == uuid.to_s - gr += self.edge(uuid, job_uuid(job), {:label => "output"}, opts) - gr += ProvenanceHelper::generate_provenance_edges(pdata, visited, job[:uuid], opts) + ProvenanceHelper::find_collections cont[:mounts] do |collection_hash, collection_uuid, key| + if @opts[:pdh_to_uuid] and @opts[:pdh_to_uuid][collection_hash] + collection_uuid = @opts[:pdh_to_uuid][collection_hash].uuid + collection_hash = nil + end + if collection_uuid and @pdata[collection_uuid] + gr += describe_node(collection_uuid) + gr += edge(collection_uuid, uuid, {:label => key}) + elsif collection_hash and @pdata[collection_hash] + gr += describe_node(collection_hash) + gr += edge(collection_hash, uuid, {:label => key}) end - if job[:log] == uuid.to_s - gr += edge(uuid, job_uuid(job), {:label => "log"}, opts) - gr += ProvenanceHelper::generate_provenance_edges(pdata, visited, job[:uuid], opts) + end + + if cont[:container_image] and !@opts[:no_docker] and @pdata[cont[:container_image]] + gr += describe_node(cont[:container_image], {label: cont[:container_image]}) + gr += edge(cont[:container_image], uuid, {label: "docker_image"}) + end + + if cont[:output_uuid] and !edge_opts[:no_output] and @pdata[cont[:output_uuid]] + gr += describe_node(cont[:output_uuid]) + gr += edge(uuid, cont[:output_uuid], {label: "output" }) + end + + if cont[:log_uuid] and !edge_opts[:no_log] and @pdata[cont[:log_uuid]] + gr += describe_node(cont[:log_uuid]) + gr += edge(uuid, cont[:log_uuid], {label: "log"}) + end + + gr + end + + def container_edges cont, edge_opts={} + uuid = cont[:uuid] + gr = "" + + gr += describe_node(cont[:uuid], {href: {controller: 'containers', + id: cont[:uuid]}, + shape: 'oval'}) + + ProvenanceHelper::find_collections cont[:mounts] do |collection_hash, collection_uuid, key| + if collection_uuid and @pdata[collection_uuid] + gr += describe_node(collection_uuid) + gr += edge(collection_uuid, uuid, {:label => key}) + elsif collection_hash and @pdata[collection_hash] + gr += describe_node(collection_hash) + gr += edge(collection_hash, uuid, {:label => key}) end end - else - # uuid is something else - rsc = ArvadosBase::resource_class_for_uuid uuid.to_s - if rsc == Job - job = pdata[uuid] + if cont[:container_image] and !@opts[:no_docker] and @pdata[cont[:container_image]] + gr += describe_node(cont[:container_image], {label: cont[:container_image]}) + gr += edge(cont[:container_image], uuid, {label: "docker_image"}) + end + + if cont[:output] and !edge_opts[:no_output] and @pdata[cont[:output]] + gr += describe_node(cont[:output]) + gr += edge(uuid, cont[:output], {label: "output" }) + end + + if cont[:log] and !edge_opts[:no_log] and @pdata[cont[:log]] + gr += describe_node(cont[:log]) + gr += edge(uuid, cont[:log], {label: "log"}) + end + + gr + end + + def generate_provenance_edges(uuid) + gr = "" + m = GenerateGraph::collection_uuid(uuid) + uuid = m if m + + if uuid.nil? or uuid.empty? or @visited[uuid] + return "" + end + + if @pdata[uuid].nil? + return "" + else + @visited[uuid] = true + end + + if uuid.start_with? "component_" + # Pipeline component inputs + job = @pdata[@pdata[uuid][:job].andand[:uuid]] + if job - gr += ProvenanceHelper::script_param_edges(pdata, visited, job, "", job[:script_parameters], opts) + gr += describe_node(job_uuid(job), {label: uuid[38..-1], pip: @opts[:pips].andand[job[:uuid]], shape: "oval", + href: {controller: 'jobs', id: job[:uuid]}}) + gr += job_edges job, {no_output: true, no_log: true} + end + + # Pipeline component output + outuuid = @pdata[uuid][:output_uuid] + if outuuid + outcollection = @pdata[outuuid] + if outcollection + gr += edge(job_uuid(job), outcollection[:portable_data_hash], {label: "output"}) + gr += describe_node(outcollection[:portable_data_hash], {label: outcollection[:name]}) + end + elsif job and job[:output] + gr += describe_node(job[:output]) + gr += edge(job_uuid(job), job[:output], {label: "output" }) end else - gr += ProvenanceHelper::describe_node(pdata, uuid) + rsc = ArvadosBase::resource_class_for_uuid uuid + + if rsc == Job + job = @pdata[uuid] + gr += job_edges job if job + elsif rsc == ContainerRequest + cr = @pdata[uuid] + gr += cr_edges cr if cr + elsif rsc == Container + cr = @pdata[uuid] + gr += container_edges cr if cr + end end - end - pdata.each do |k, link| - if link[:head_uuid] == uuid.to_s and link[:link_class] == "provenance" - gr += ProvenanceHelper::describe_node(pdata, link[:tail_uuid]) - gr += edge(link[:head_uuid], link[:tail_uuid], {:label => link[:name], :href => "/links/#{link[:uuid]}"}, opts) - gr += ProvenanceHelper::generate_provenance_edges(pdata, visited, link[:tail_uuid], opts) + @pdata.each do |k, link| + if link[:head_uuid] == uuid.to_s and link[:link_class] == "provenance" + href = url_for ({:controller => Link.to_s.tableize, + :action => :show, + :id => link[:uuid] }) + + gr += describe_node(link[:tail_uuid]) + gr += edge(link[:head_uuid], link[:tail_uuid], {:label => link[:name], :href => href}) + gr += generate_provenance_edges(link[:tail_uuid]) + end end + + gr end - #puts "finished #{uuid}" + def describe_jobs + gr = "" + @jobs.each do |k, v| + href = url_for ({:controller => Job.to_s.tableize, + :action => :index }) + + gr += "\"#{k}\" [href=\"#{href}?" + + n = 0 + v.each do |u| + gr += ";" unless gr.end_with? "?" + gr += "uuid%5b%5d=#{u[:uuid]}" + n |= @opts[:pips][u[:uuid]] if @opts[:pips] and @opts[:pips][u[:uuid]] + end + + gr += "\",label=\"" + + label = "#{v[0][:script]}" + + if label == "run-command" and v[0][:script_parameters][:command].is_a? Array + label = v[0][:script_parameters][:command].join(' ') + end + + if not @opts[:combine_jobs] + label += "\\n#{v[0][:finished_at]}" + end + + gr += encode_quotes label + + gr += "\",#{determine_fillcolor n}];\n" + end + gr + end - gr + def encode_quotes value + value.to_s.gsub("\"", "\\\"").gsub("\n", "\\n") + end end - def self.create_provenance_graph(pdata, uuid, opts={}) - require 'open3' - - gr = """strict digraph { -node [fontsize=8,shape=box]; -edge [fontsize=8];""" + def self.create_provenance_graph(pdata, svgId, opts={}) + if pdata.is_a? Array or pdata.is_a? ArvadosResourceList + p2 = {} + pdata.each do |k| + p2[k[:uuid]] = k if k[:uuid] + end + pdata = p2 + end + + unless pdata.is_a? Hash + raise "create_provenance_graph accepts Array or Hash for pdata only, pdata is #{pdata.class}" + end - if opts[:direction] == :bottom_up - gr += "edge [dir=back];" + gr = """strict digraph { +node [fontsize=10,fontname=\"Helvetica,Arial,sans-serif\"]; +edge [fontsize=10,fontname=\"Helvetica,Arial,sans-serif\"]; +""" + if ["LR", "RL"].include? opts[:direction] + gr += "rankdir=#{opts[:direction]};" end - #puts "pdata is #{pdata}" + begin + pdata = pdata.stringify_keys + + g = GenerateGraph.new(pdata, opts) + + pdata.each do |k, v| + if !opts[:only_components] or k.start_with? "component_" + gr += g.generate_provenance_edges(k) + else + #gr += describe_node(k) + end + end - visited = {} - if uuid.respond_to? :each - uuid.each do |u| - gr += ProvenanceHelper::generate_provenance_edges(pdata, visited, u, opts) + if !opts[:only_components] + gr += g.describe_jobs end - else - gr += ProvenanceHelper::generate_provenance_edges(pdata, visited, uuid, opts) + + rescue => e + Rails.logger.warn "#{e.inspect}" + Rails.logger.warn "#{e.backtrace.join("\n\t")}" + raise end gr += "}" svg = "" - #puts gr + require 'open3' Open3.popen2("dot", "-Tsvg") do |stdin, stdout, wait_thr| stdin.print(gr) @@ -215,5 +393,45 @@ edge [fontsize=8];""" svg = svg.sub(/<\?xml.*?\?>/m, "") svg = svg.sub(//m, "") + svg = svg.sub(/