Merge branch '19215-installer' refs #19215

author Peter Amstutz <peter.amstutz@curii.com>

Mon, 5 Dec 2022 18:43:01 +0000 (13:43 -0500)

committer Peter Amstutz <peter.amstutz@curii.com>

Mon, 5 Dec 2022 18:43:01 +0000 (13:43 -0500)
author Peter Amstutz <peter.amstutz@curii.com>
Mon, 5 Dec 2022 18:43:01 +0000 (13:43 -0500)
committer Peter Amstutz <peter.amstutz@curii.com>
Mon, 5 Dec 2022 18:43:01 +0000 (13:43 -0500)
diff --git a/.gitignore b/.gitignore

index 07482bde73e01d82f590b6b3fa1d9e1f95719001..c156018036e74a3582e922d97b610d450d5fbac9 100644 (file)
--- a/.gitignore
+++ b/.gitignore
@@ -14,10 +14,6 @@ doc/.site
  doc/sdk/python/arvados
  doc/sdk/R/arvados
  doc/sdk/java-v2/javadoc
-sdk/perl/MYMETA.*
-sdk/perl/Makefile
-sdk/perl/blib
-sdk/perl/pm_to_blib
  */vendor
  */*/vendor
  sdk/java/target
diff --git a/apps/workbench/Gemfile.lock b/apps/workbench/Gemfile.lock

index a70add7affbafd5364b1bc86149a26af4860c893..c66272cd3f965ebe198ec9fea8d70f455c8cb270 100644 (file)
--- a/apps/workbench/Gemfile.lock
+++ b/apps/workbench/Gemfile.lock
@@ -179,14 +179,14 @@ GEM
      net-ssh-gateway (2.0.0)
        net-ssh (>= 4.0.0)
      nio4r (2.5.8)
-    nokogiri (1.13.7)
+    nokogiri (1.13.9)
        mini_portile2 (~> 2.8.0)
        racc (~> 1.4)
      npm-rails (0.2.1)
        rails (>= 3.2)
      oj (3.7.12)
      os (1.1.1)
-    passenger (6.0.2)
+    passenger (6.0.15)
        rack
        rake (>= 0.8.1)
      piwik_analytics (1.0.2)
diff --git a/apps/workbench/app/helpers/version_helper.rb b/apps/workbench/app/helpers/version_helper.rb

index e673c812102143d451fa48887b4cdf9d28e060a6..d11071272b28728038710969543c5ec908d4e958 100644 (file)
--- a/apps/workbench/app/helpers/version_helper.rb
+++ b/apps/workbench/app/helpers/version_helper.rb
@@ -17,6 +17,6 @@ module VersionHelper
  
    # URL for browsing source code for the given version.
    def version_link_target version
-    "https://arvados.org/projects/arvados/repository/changes?rev=#{version.sub(/-.*/, "")}"
+    "https://dev.arvados.org/projects/arvados/repository/changes?rev=#{version.sub(/-.*/, "")}"
    end
  end
diff --git a/apps/workbench/app/views/users/_tables.html.erb b/apps/workbench/app/views/users/_tables.html.erb

index 01a77cdd6188fd35ea409e9c8e90c7f5babb29b4..6e3d9e3437ad34abde3be6ef3166d8dc6bf20f02 100644 (file)
--- a/apps/workbench/app/views/users/_tables.html.erb
+++ b/apps/workbench/app/views/users/_tables.html.erb
@@ -254,7 +254,7 @@ SPDX-License-Identifier: AGPL-3.0 %>
            <%= link_to "contact us", Rails.configuration.Workbench.ActivationContactLink %>.
            You should receive an email at the address you used to log in when
            your account is activated.  In the mean time, you can
-          <%= link_to "learn more about Arvados", "https://arvados.org/projects/arvados/wiki/Introduction_to_Arvados" %>,
+          <%= link_to "learn more about Arvados", "https://arvados.org/" %>,
            and <%= link_to "read the Arvados user guide", "http://doc.arvados.org/user" %>.
          </p>
          <p style="padding-bottom: 1em">
diff --git a/apps/workbench/test/integration/report_issue_test.rb b/apps/workbench/test/integration/report_issue_test.rb

index d2c4372bce0de489954afa620fabd861f1b42948..98ce8aad141f1627a466ba87ccbe98da0fef9817 100644 (file)
--- a/apps/workbench/test/integration/report_issue_test.rb
+++ b/apps/workbench/test/integration/report_issue_test.rb
@@ -37,7 +37,7 @@ class ReportIssueTest < ActionDispatch::IntegrationTest
        assert page.has_button?('Close'), 'No button - Close'
        assert page.has_no_button?('Send problem report'), 'Found button - Send problem report'
        history_links = all('a').select do |a|
-        a[:href] =~ %r!^https://arvados.org/projects/arvados/repository/changes\?rev=[0-9a-f]+$!
+        a[:href] =~ %r!^https://dev.arvados.org/projects/arvados/repository/changes\?rev=[0-9a-f]+$!
        end
        assert_operator(2, :<=, history_links.count,
                        "Should have found two links to revision history " +
diff --git a/build/package-build-dockerfiles/centos7/Dockerfile b/build/package-build-dockerfiles/centos7/Dockerfile

index 5bae5f434c32b5eb86bf7c4e496dfb8f08839ba6..f0ae5df3f74eb3655db25988fcf5526fcd59414b 100644 (file)
--- a/build/package-build-dockerfiles/centos7/Dockerfile
+++ b/build/package-build-dockerfiles/centos7/Dockerfile
@@ -32,7 +32,7 @@ ENV DEBIAN_FRONTEND noninteractive
  
  SHELL ["/bin/bash", "-c"]
  # Install dependencies.
-RUN yum -q -y install make automake gcc gcc-c++ libyaml-devel patch readline-devel zlib-devel libffi-devel openssl-devel bzip2 libtool bison sqlite-devel rpm-build git perl-ExtUtils-MakeMaker libattr-devel nss-devel libcurl-devel which tar unzip scl-utils centos-release-scl postgresql-devel fuse-devel xz-libs git wget pam-devel
+RUN yum -q -y install make automake gcc gcc-c++ libyaml-devel patch readline-devel zlib-devel libffi-devel openssl-devel bzip2 libtool bison sqlite-devel rpm-build git libattr-devel nss-devel libcurl-devel which tar unzip scl-utils centos-release-scl postgresql-devel fuse-devel xz-libs git wget pam-devel
  
  # Install RVM
  ADD generated/mpapis.asc /tmp/
diff --git a/build/run-build-packages-one-target.sh b/build/run-build-packages-one-target.sh

index 7d9b5b6a37abb14185a693ff331859137d7f4082..905af1cbc62a76cc314ccba3dcdd9fa1145d2586 100755 (executable)
--- a/build/run-build-packages-one-target.sh
+++ b/build/run-build-packages-one-target.sh
@@ -232,7 +232,6 @@ if test -z "$packages" ; then
          keep-rsync
          keep-block-check
          keep-web
-        libarvados-perl
          libpam-arvados-go
          python3-cwltest
          python3-arvados-fuse
diff --git a/build/run-build-packages.sh b/build/run-build-packages.sh

index d4240d4f26b9120c3477aff6460a66aa3c169955..aded25b592a3a941e794d0223cd0f0c8ea5f412a 100755 (executable)
--- a/build/run-build-packages.sh
+++ b/build/run-build-packages.sh
@@ -207,11 +207,6 @@ fi
  # Required due to CVE-2022-24765
  git config --global --add safe.directory /arvados
  
-# Perl packages
-debug_echo -e "\nPerl packages\n"
-
-handle_libarvados_perl
-
  # Ruby gems
  debug_echo -e "\nRuby gems\n"
  
diff --git a/build/run-library.sh b/build/run-library.sh

index 47c5e2a39a22f98cc0ad18631e814ea4f4285c63..c2466faac0f38f66ade7a3e2d3c509a1e9acbbe8 100755 (executable)
--- a/build/run-library.sh
+++ b/build/run-library.sh
@@ -696,40 +696,6 @@ handle_arvados_src () {
    )
  }
  
-# Usage: handle_libarvados_perl
-handle_libarvados_perl () {
-  if [[ -n "$ONLY_BUILD" ]] && [[ "$ONLY_BUILD" != "libarvados-perl" ]] ; then
-    debug_echo -e "Skipping build of libarvados-perl package."
-    return 0
-  fi
-  # The perl sdk subdirectory is so old that it has no tag in its history,
-  # which causes version_at_commit.sh to fail. Just rebuild it every time.
-  cd "$WORKSPACE"
-  libarvados_perl_version="$(version_from_git)"
-  cd "$WORKSPACE/sdk/perl"
-
-  cd $WORKSPACE/packages/$TARGET
-  test_package_presence libarvados-perl "$libarvados_perl_version"
-
-  if [[ "$?" == "0" ]]; then
-    cd "$WORKSPACE/sdk/perl"
-
-    if [[ -e Makefile ]]; then
-      make realclean >"$STDOUT_IF_DEBUG"
-    fi
-    find -maxdepth 1 \( -name 'MANIFEST*' -or -name "libarvados-perl*.$FORMAT" \) \
-        -delete
-    rm -rf install
-
-    perl Makefile.PL INSTALL_BASE=install >"$STDOUT_IF_DEBUG" && \
-        make install INSTALLDIRS=perl >"$STDOUT_IF_DEBUG" && \
-        fpm_build "$WORKSPACE/sdk/perl" install/lib/=/usr/share libarvados-perl \
-        dir "$libarvados_perl_version" install/man/=/usr/share/man \
-        "$WORKSPACE/apache-2.0.txt=/usr/share/doc/libarvados-perl/apache-2.0.txt" && \
-        mv --no-clobber libarvados-perl*.$FORMAT "$WORKSPACE/packages/$TARGET/"
-  fi
-}
-
  # Build python packages with a virtualenv built-in
  # Usage: fpm_build_virtualenv arvados-python-client sdk/python [deb|rpm] [amd64|arm64]
  fpm_build_virtualenv () {
diff --git a/build/run-tests.sh b/build/run-tests.sh

index ee52c4b9dd1a625d99a14f4ac279731424236175..a5c7277580496cd1fe4748aed040ce2261bd3e95 100755 (executable)
--- a/build/run-tests.sh
+++ b/build/run-tests.sh
@@ -58,7 +58,7 @@ defaults to $HOME/arvados-api-server if that directory exists.
  
  More information and background:
  
-https://arvados.org/projects/arvados/wiki/Running_tests
+https://dev.arvados.org/projects/arvados/wiki/Running_tests
  
  Available tests:
  
@@ -150,7 +150,6 @@ VENVDIR=
  VENV3DIR=
  PYTHONPATH=
  GEMHOME=
-PERLINSTALLBASE=
  R_LIBS=
  export LANG=en_US.UTF-8
  
@@ -232,14 +231,6 @@ sanity_checks() {
      echo -n 'nginx: '
      PATH="$PATH:/sbin:/usr/sbin:/usr/local/sbin" nginx -v \
          || fatal "No nginx. Try: apt-get install nginx"
-    echo -n 'perl: '
-    perl -v | grep version \
-        || fatal "No perl. Try: apt-get install perl"
-    for mod in ExtUtils::MakeMaker JSON LWP Net::SSL; do
-        echo -n "perl $mod: "
-        perl -e "use $mod; print \"\$$mod::VERSION\\n\"" \
-            || fatal "No $mod. Try: apt-get install perl-modules libcrypt-ssleay-perl libjson-perl libwww-perl"
-    done
      echo -n 'gitolite: '
      which gitolite \
          || fatal "No gitolite. Try: apt-get install gitolite3"
@@ -621,7 +612,7 @@ initialize() {
      fi
  
      # Set up temporary install dirs (unless existing dirs were supplied)
-    for tmpdir in VENV3DIR GOPATH GEMHOME PERLINSTALLBASE R_LIBS
+    for tmpdir in VENV3DIR GOPATH GEMHOME R_LIBS
      do
          if [[ -z "${!tmpdir}" ]]; then
              eval "$tmpdir"="$temp/$tmpdir"
@@ -633,9 +624,6 @@ initialize() {
  
      rm -vf "${WORKSPACE}/tmp/*.log"
  
-    export PERLINSTALLBASE
-    export PERL5LIB="$PERLINSTALLBASE/lib/perl5${PERL5LIB:+:$PERL5LIB}"
-
      export R_LIBS
  
      export GOPATH
@@ -928,17 +916,12 @@ install_sdk/R() {
    fi
  }
  
-install_sdk/perl() {
-    cd "$WORKSPACE/sdk/perl" \
-        && perl Makefile.PL INSTALL_BASE="$PERLINSTALLBASE" \
-        && make install INSTALLDIRS=perl
-}
-
  install_sdk/cli() {
      install_gem arvados-cli sdk/cli
  }
  
  install_services/login-sync() {
+    install_gem arvados sdk/ruby
      install_gem arvados-login-sync services/login-sync
  }
  
@@ -1096,7 +1079,6 @@ install_deps() {
      do_install env
      do_install cmd/arvados-server go
      do_install sdk/cli
-    do_install sdk/perl
      do_install sdk/python pip "${VENV3DIR}/bin/"
      do_install sdk/ruby
      do_install services/api
@@ -1109,7 +1091,6 @@ install_all() {
      do_install doc
      do_install sdk/ruby
      do_install sdk/R
-    do_install sdk/perl
      do_install sdk/cli
      do_install services/login-sync
      for p in "${pythonstuff[@]}"
diff --git a/doc/_config.yml b/doc/_config.yml

index 93d915039c626d01f69d2127dd458b04a6b826f8..96ac4252ef983841b8cd59a0f6e591e4a8c5ee3b 100644 (file)
--- a/doc/_config.yml
+++ b/doc/_config.yml
@@ -89,6 +89,7 @@ navbar:
        - sdk/cli/index.html.textile.liquid
        - sdk/cli/reference.html.textile.liquid
        - sdk/cli/subcommands.html.textile.liquid
+      - sdk/cli/project-management.html.textile.liquid
      - Go:
        - sdk/go/index.html.textile.liquid
        - sdk/go/example.html.textile.liquid
@@ -102,9 +103,6 @@ navbar:
        - sdk/java-v2/index.html.textile.liquid
        - sdk/java-v2/example.html.textile.liquid
        - sdk/java-v2/javadoc.html.textile.liquid
-    - Perl:
-      - sdk/perl/index.html.textile.liquid
-      - sdk/perl/example.html.textile.liquid
    api:
      - Concepts:
        - api/index.html.textile.liquid
@@ -131,6 +129,7 @@ navbar:
        - api/keep-s3.html.textile.liquid
        - api/keep-web-urls.html.textile.liquid
        - api/projects.html.textile.liquid
+      - api/properties.html.textile.liquid
        - api/methods/collections.html.textile.liquid
        - api/methods/repositories.html.textile.liquid
      - Container engine:
@@ -172,21 +171,22 @@ navbar:
      - Users and Groups:
        - admin/user-management.html.textile.liquid
        - admin/user-management-cli.html.textile.liquid
+      - admin/group-management.html.textile.liquid
        - admin/reassign-ownership.html.textile.liquid
        - admin/link-accounts.html.textile.liquid
-      - admin/group-management.html.textile.liquid
        - admin/federation.html.textile.liquid
        - admin/merge-remote-account.html.textile.liquid
        - admin/migrating-providers.html.textile.liquid
        - user/topics/arvados-sync-external-sources.html.textile.liquid
        - admin/scoped-tokens.html.textile.liquid
        - admin/token-expiration-policy.html.textile.liquid
-      - admin/user-activity.html.textile.liquid
      - Monitoring:
        - admin/logging.html.textile.liquid
        - admin/metrics.html.textile.liquid
        - admin/health-checks.html.textile.liquid
+      - admin/diagnostics.html.textile.liquid
        - admin/management-token.html.textile.liquid
+      - admin/user-activity.html.textile.liquid
      - Data Management:
        - admin/collection-versioning.html.textile.liquid
        - admin/collection-managed-properties.html.textile.liquid
diff --git a/doc/admin/diagnostics.html.textile.liquid b/doc/admin/diagnostics.html.textile.liquid

new file mode 100644 (file)

index 0000000..ec6a9bf
--- /dev/null
+++ b/doc/admin/diagnostics.html.textile.liquid
@@ -0,0 +1,83 @@
+---
+layout: default
+navsection: admin
+title: Diagnostics
+...
+
+{% comment %}
+Copyright (C) The Arvados Authors. All rights reserved.
+
+SPDX-License-Identifier: CC-BY-SA-3.0
+{% endcomment %}
+
+The @arvados-client diagnostics@ command exercises basic cluster functionality, and identifies some common installation and configuration problems. Especially after upgrading or reconfiguring Arvados or server/network infrastructure, it can be the quickest way to identify problems.
+
+h2. Using system privileges
+
+On a server node, it is easiest to run the diagnostics command with system privileges. The word @sudo@ here instructs the @arvados-client@ command to load @Controller.ExternalURL@ and @SystemRootToken@ from @/etc/arvados/config.yml@ and use those credentials to run tests with system privileges.
+
+When run this way, diagnostics will also include "health checks":health-checks.html.
+
+<notextile><pre>
+# <span class="userinput">arvados-client sudo diagnostics</span>
+</pre></notextile>
+
+h2. Using regular user privileges
+
+On any node (server node, shell node, or a workstation outside the system network), you can also run diagnostics by setting the usual @ARVADOS_API_HOST@ and @ARVADOS_API_TOKEN@ environment variables. Typically this is done with a regular user account.
+
+<notextile><pre>
+$ <span class="userinput">export ARVADOS_API_HOST=zzzzz.arvadosapi.com</span>
+$ <span class="userinput">export ARVADOS_API_TOKEN=xxxxxxxxxx</span>
+$ <span class="userinput">arvados-client diagnostics</span>
+</pre></notextile>
+
+h2. Internal/external client detection
+
+The diagnostics output indicates whether its client connection is categorized by the server as internal or external. If you run diagnostics automatically with cron or a monitoring tool, you can use the @-internal-client@ or @-external-client@ flag to specify how you _expect_ the client to be categorized, and the test will fail otherwise. Example:
+
+<notextile><pre>
+# <span class="userinput">arvados-client sudo diagnostics -internal-client</span>
+[...]
+
+--- cut here --- error summary ---
+
+ERROR     60: checking internal/external client detection (11 ms): expecting internal=true external=false, but found internal=false external=true
+</pre></notextile>
+
+h2. Example output
+
+<notextile><pre>
+# <span class="userinput">arvados-client sudo diagnostics</span>
+INFO       5: running health check (same as `arvados-server check`)
+INFO      10: getting discovery document from https://zzzzz.arvadosapi.com/discovery/v1/apis/arvados/v1/rest
+INFO      20: getting exported config from https://zzzzz.arvadosapi.com/arvados/v1/config
+INFO      30: getting current user record
+INFO      40: connecting to service endpoint https://keep.zzzzz.arvadosapi.com/
+INFO      41: connecting to service endpoint https://*.collections.zzzzz.arvadosapi.com/
+INFO      42: connecting to service endpoint https://download.zzzzz.arvadosapi.com/
+INFO      43: connecting to service endpoint wss://ws.zzzzz.arvadosapi.com/websocket
+INFO      44: connecting to service endpoint https://workbench.zzzzz.arvadosapi.com/
+INFO      45: connecting to service endpoint https://workbench2.zzzzz.arvadosapi.com/
+INFO      50: checking CORS headers at https://zzzzz.arvadosapi.com/
+INFO      51: checking CORS headers at https://keep.zzzzz.arvadosapi.com/d41d8cd98f00b204e9800998ecf8427e+0
+INFO      52: checking CORS headers at https://download.zzzzz.arvadosapi.com/
+INFO      60: checking internal/external client detection
+INFO      61: reading+writing via keep service at https://keep.zzzzz.arvadosapi.com:443/
+INFO      80: finding/creating "scratch area for diagnostics" project
+INFO      90: creating temporary collection
+INFO     100: uploading file via webdav
+INFO     110: checking WebDAV ExternalURL wildcard (https://*.collections.zzzzz.arvadosapi.com/)
+INFO     120: downloading from webdav (https://d41d8cd98f00b204e9800998ecf8427e-0.collections.zzzzz.arvadosapi.com/foo)
+INFO     121: downloading from webdav (https://d41d8cd98f00b204e9800998ecf8427e-0.collections.zzzzz.arvadosapi.com/sha256:feb5d9fea6a5e9606aa995e879d862b825965ba48de054caab5ef356dc6b3412.tar)
+INFO     122: downloading from webdav (https://download.zzzzz.arvadosapi.com/c=d41d8cd98f00b204e9800998ecf8427e+0/_/foo)
+INFO     123: downloading from webdav (https://download.zzzzz.arvadosapi.com/c=d41d8cd98f00b204e9800998ecf8427e+0/_/sha256:feb5d9fea6a5e9606aa995e879d862b825965ba48de054caab5ef356dc6b3412.tar)
+INFO     124: downloading from webdav (https://a15a27cbc1c7d2d4a0d9e02529aaec7e-128.collections.zzzzz.arvadosapi.com/sha256:feb5d9fea6a5e9606aa995e879d862b825965ba48de054caab5ef356dc6b3412.tar)
+INFO     125: downloading from webdav (https://download.zzzzz.arvadosapi.com/c=zzzzz-4zz18-twitqma8mbvwydy/_/sha256:feb5d9fea6a5e9606aa995e879d862b825965ba48de054caab5ef356dc6b3412.tar)
+INFO     130: getting list of virtual machines
+INFO     140: getting workbench1 webshell page
+INFO     150: connecting to webshell service
+INFO     160: running a container
+INFO      ... container request submitted, waiting up to 10m for container to run
+INFO    9990: deleting temporary collection
+</pre></notextile>
diff --git a/doc/admin/federation.html.textile.liquid b/doc/admin/federation.html.textile.liquid

index 74480e7dee5000c14815475ea74d5e65d301ac13..acc7f6fbe61fe7563bbf2a818c2af74c0c628b51 100644 (file)
--- a/doc/admin/federation.html.textile.liquid
+++ b/doc/admin/federation.html.textile.liquid
@@ -25,11 +25,11 @@ Clusters:
    clsr1:
      RemoteClusters:
        clsr2:
-        Host: api.cluster2.com
+        Host: api.cluster2.example
          Proxy: true
         ActivateUsers: true
        clsr3:
-        Host: api.cluster3.com
+        Host: api.cluster3.example
          Proxy: true
         ActivateUsers: false
  </pre>
@@ -82,8 +82,10 @@ Clusters:
    clsr1:
      Login:
        TrustedClients:
-        "https://workbench.cluster2.com": {}
-        "https://workbench.cluster3.com": {}
+        "https://workbench.cluster2.example": {}
+        "https://workbench2.cluster2.example": {}
+        "https://workbench.cluster3.example": {}
+        "https://workbench2.cluster3.example": {}
  </pre>
  
  h2. Testing
@@ -91,7 +93,7 @@ h2. Testing
  Following the above example, let's suppose @clsr1@ is our "home cluster", that is to say, we use our @clsr1@ user account as our federated identity and both @clsr2@ and @clsr3@ remote clusters are set up to allow users from @clsr1@ and to auto-activate them. The first thing to do would be to log into a remote workbench using the local user token. This can be done following these steps:
  
  1. Log into the local workbench and get the user token
-2. Visit the remote workbench specifying the local user token by URL: @https://workbench.cluster2.com?api_token=token_from_clsr1@
+2. Visit the remote workbench specifying the local user token by URL: @https://workbench.cluster2.example?api_token=token_from_clsr1@
  3. You should now be logged into @clsr2@ with your account from @clsr1@
  
  To further test the federation setup, you can create a collection on @clsr2@, uploading some files and copying its UUID. Next, logged into a shell node on your home cluster you should be able to get that collection by running:
diff --git a/doc/admin/group-management.html.textile.liquid b/doc/admin/group-management.html.textile.liquid

index dddfe13ac85d4aca8b0407f9f7b1f562f15aae8a..43319e873a577717ae0aee65cf6e023c08770939 100644 (file)
--- a/doc/admin/group-management.html.textile.liquid
+++ b/doc/admin/group-management.html.textile.liquid
@@ -1,7 +1,7 @@
  ---
  layout: default
  navsection: admin
-title: Group management
+title: Role group management at the CLI
  ...
  
  {% comment %}
@@ -12,7 +12,7 @@ SPDX-License-Identifier: CC-BY-SA-3.0
  
  This page describes how to manage groups at the command line.  You should be familiar with the "permission system":{{site.baseurl}}/api/permission-model.html .
  
-h2. Create a group
+h2. Create a role group
  
  User groups are entries in the "groups" table with @"group_class": "role"@.
  
@@ -20,7 +20,7 @@ User groups are entries in the "groups" table with @"group_class": "role"@.
  arv group create --group '{"name": "My new group", "group_class": "role"}'
  </pre>
  
-h2(#add). Add a user to a group
+h2(#add). Add a user to a role group
  
  There are two separate permissions associated with group membership.  The first link grants the user @can_manage@ permission to manage things that the group can manage.  The second link grants permission for other users of the group to see that this user is part of the group.
  
@@ -40,13 +40,13 @@ arv link create --link '{
  
  A user can also be given read-only access to a group.  In that case, the first link should be created with @can_read@ instead of @can_manage@.
  
-h2. List groups
+h2. List role groups
  
  <pre>
  arv group list --filters '[["group_class", "=", "role"]]'
  </pre>
  
-h2. List members of a group
+h2. List members of a role group
  
  Use the command "jq":https://stedolan.github.io/jq/ to extract the tail_uuid of each permission link which has the user uuid.
  
@@ -55,9 +55,9 @@ arv link list --filters '[["link_class", "=", "permission"],
    ["head_uuid", "=", "the_group_uuid"]]' | jq .items[].tail_uuid
  </pre>
  
-h2. Share a project with a group
+h2(#share-project). Share a project with a role group
  
-This will give all members of the group @can_manage@ access.
+Members of the role group will have access to the project based on their level of access to the role group.
  
  <pre>
  arv link create --link '{
@@ -67,7 +67,7 @@ arv link create --link '{
    "head_uuid": "the_project_uuid"}'
  </pre>
  
-A project can also be shared read-only.  In that case, the first link should be created with @can_read@ instead of @can_manage@.
+A project can also be shared read-only.  In that case, the link @name@ should be @can_read@ instead of @can_manage@.
  
  h2. List things shared with the group
  
@@ -78,7 +78,7 @@ arv link list --filters '[["link_class", "=", "permission"],
    ["tail_uuid", "=", "the_group_uuid"]]' | jq .items[].head_uuid
  </pre>
  
-h2. Stop sharing a project with a group
+h2(#stop-sharing-project). Stop sharing a project with a group
  
  This will remove access for members of the group.
  
@@ -91,7 +91,7 @@ arv --format=uuid link list --filters '[["link_class", "=", "permission"],
  arv link delete --uuid each_link_uuid
  </pre>
  
-h2. Remove user from a group
+h2. Remove user from a role group
  
  The first step is to find the permission link objects.  The second step is to delete them.
  
diff --git a/doc/admin/health-checks.html.textile.liquid b/doc/admin/health-checks.html.textile.liquid

index 7c878269645926121c70a3edc1346c16311ca81c..fa273cd204df72cedce38502ba5095ab8c015f4b 100644 (file)
--- a/doc/admin/health-checks.html.textile.liquid
+++ b/doc/admin/health-checks.html.textile.liquid
@@ -29,8 +29,43 @@ Health check endpoints return a JSON object with the field @health@.  This has a
  }
  </pre>
  
-h2. Healthcheck aggregator
+h2. Health check aggregator
  
  The service @arvados-health@ performs health checks on all configured services and returns a single value of @OK@ or @ERROR@ for the entire cluster.  It exposes the endpoint @/_health/all@ .
  
  The healthcheck aggregator uses the @Services@ section of the cluster-wide @config.yml@ configuration file.
+
+h2. Health check command
+
+The @arvados-server check@ command is another way to perform the same health checks as the health check aggregator service. It does not depend on the aggregator service.
+
+If all checks pass, it writes @health check OK@ to stderr (unless the @-quiet@ flag is used) and exits 0. Otherwise, it writes error messages to stderr and exits with error status.
+
+@arvados-server check -yaml@ outputs a YAML document on stdout with additional details about each service endpoint that was checked.
+
+{% codeblock as yaml %}
+Checks:
+  "arvados-api-server+http://localhost:8004/_health/ping":
+    ClockTime: "2022-11-16T16:08:57Z"
+    ConfigSourceSHA256: e2c086ae3dd290cf029cb3fe79146529622279b6280cf6cd17dc8d8c30daa57f
+    ConfigSourceTimestamp: "2022-11-07T18:08:24.539545Z"
+    HTTPStatusCode: 200
+    Health: OK
+    Response:
+      health: OK
+    ResponseTime: 0.017159
+    Server: nginx/1.14.0 + Phusion Passenger(R) 6.0.15
+    Version: 2.5.0~dev20221116141533
+  "arvados-controller+http://localhost:8003/_health/ping":
+    ClockTime: "2022-11-16T16:08:57Z"
+    ConfigSourceSHA256: e2c086ae3dd290cf029cb3fe79146529622279b6280cf6cd17dc8d8c30daa57f
+    ConfigSourceTimestamp: "2022-11-07T18:08:24.539545Z"
+    HTTPStatusCode: 200
+    Health: OK
+    Response:
+      health: OK
+    ResponseTime: 0.004748
+    Server: ""
+    Version: 2.5.0~dev20221116141533 (go1.18.8)
+# ...
+{% endcodeblock %}
diff --git a/doc/admin/maintenance-and-upgrading.html.textile.liquid b/doc/admin/maintenance-and-upgrading.html.textile.liquid

index 480f5114ea135625754e03410a2a20501521f48f..253e82bdc3a2a3e21aa1f38cc493f230a06bd105 100644 (file)
--- a/doc/admin/maintenance-and-upgrading.html.textile.liquid
+++ b/doc/admin/maintenance-and-upgrading.html.textile.liquid
@@ -52,6 +52,8 @@ If you know which Arvados service uses the specific configuration that was modif
  
  To check for services that have not restarted since the configuration file was updated, run the @arvados-server check@ command on each system node.
  
+To test functionality and check for common problems, run the @arvados-client sudo diagnostics@ command on a system node.
+
  h2(#upgrading). Upgrading Arvados
  
  Upgrading Arvados typically involves the following steps:
@@ -60,9 +62,12 @@ Upgrading Arvados typically involves the following steps:
  # Wait for the cluster to be idle and stop Arvados services.
  # Make a backup of your database, as a precaution.
  # update the configuration file for the new release, if necessary (see "Maintaining Arvados":#maintaining above)
-# rebuild and deploy the "compute node image":{{site.baseurl}}/install/crunch2-cloud/install-compute-node.html (cloud only)
+# Update compute nodes
+## (cloud) Rebuild and deploy the "compute node image":{{site.baseurl}}/install/crunch2-cloud/install-compute-node.html
+## (slurm/LSF) Upgrade the @python3-arvados-fuse@ package used on your compute nodes
  # Install new packages using @apt-get upgrade@ or @yum upgrade@.
  # Wait for package installation scripts as they perform any necessary data migrations.
  # Run @arvados-server config-check@ to detect configuration errors or deprecated entries.
  # Verify that the Arvados services were restarted as part of the package upgrades.
  # Run @arvados-server check@ to detect services that did not restart properly.
+# Run @arvados-client sudo diagnostics@ to test functionality.
diff --git a/doc/admin/upgrading.html.textile.liquid b/doc/admin/upgrading.html.textile.liquid

index cfdae50eb246bae8b042d1184e43bed4650c46be..9b1ca90ba4b8c432a5f61643f631f4ccc1756f43 100644 (file)
--- a/doc/admin/upgrading.html.textile.liquid
+++ b/doc/admin/upgrading.html.textile.liquid
@@ -29,9 +29,29 @@ TODO: extract this information based on git commit messages and generate changel
  </notextile>
  
  
-h2(#main). development main (as of 2022-09-21)
+h2(#main). development main (as of 2022-10-31)
  
-"previous: Upgrading to 2.4.3":#v2_4_3
+"previous: Upgrading to 2.4.4":#v2_4_4
+
+h3. Google or OpenID Connect login restricted to trusted clients
+
+If you use OpenID Connect or Google login, and your cluster serves as the @LoginCluster@ in a federation _or_ your users log in from a web application other than the Workbench1 and Workbench2 @ExternalURL@ addresses in your configuration file, the additional web application URLs (e.g., the other clusters' Workbench addresses) must be listed explicitly in @Login.TrustedClients@, otherwise login will fail. Previously, login would succeed with a less-privileged token.
+
+h3. New keepstore S3 driver enabled by default
+
+A more actively maintained S3 client library is now enabled by default for keepstore services. The previous driver is still available for use in case of unknown issues. To use the old driver, set @DriverParameters.UseAWSS3v2Driver@ to @false@ on the appropriate @Volumes@ config entries.
+
+h3. Old container logs are automatically deleted from PostgreSQL
+
+Cached copies of log entries from containers that finished more than 1 month ago are now deleted automatically (this only affects the "live" logs saved in the PostgreSQL database, not log collections saved in Keep). If you have an existing cron job that runs @rake db:delete_old_container_logs@, you can remove it. See configuration options @Containers.Logging.MaxAge@ and @Containers.Logging.SweepInterval@.
+
+h3. Fixed salt installer template file to support container shell access
+
+If you manage your cluster using the salt installer, you may want to update it to the latest version, use the appropriate @config_examples@ subdirectory and re-deploy with your custom @local.params@ file so that the @arvados-controller@'s @nginx@ configuration file gets fixed.
+
+h3. Login-sync script requires configuration update on LoginCluster federations
+
+If you have @arvados-login-sync@ running on a satellite cluster, please update the environment variable settings by removing the @LOGINCLUSTER_ARVADOS_API_*@ variables and setting @ARVADOS_API_TOKEN@ to a LoginCluster's admin token, as described on the "updated install page":{{site.baseurl}}/install/install-shell-server.html#arvados-login-sync.
  
  h3. Renamed keep-web metrics and WebDAV configs
  
@@ -39,6 +59,12 @@ Metrics previously reported by keep-web (@arvados_keepweb_collectioncache_reques
  
  The config entries @Collections.WebDAVCache.UUIDTTL@, @...MaxCollectionEntries@, and @...MaxUUIDEntries@ are no longer used, and should be removed from your config file.
  
+h2(#v2_4_4). v2.4.4 (2022-11-18)
+
+"previous: Upgrading to 2.4.3":#v2_4_3
+
+This update only consists of improvements to @arvados-cwl-runner@.  There are no changes to backend services.
+
  h2(#v2_4_3). v2.4.3 (2022-09-21)
  
  "previous: Upgrading to 2.4.2":#v2_4_2
diff --git a/doc/api/methods/groups.html.textile.liquid b/doc/api/methods/groups.html.textile.liquid

index db0aac3c7a3570fd0b3b5e9aa2c74dbe9874c196..72fca48560e9398dc7bf62183f320fcbfd1f9ea8 100644 (file)
--- a/doc/api/methods/groups.html.textile.liquid
+++ b/doc/api/methods/groups.html.textile.liquid
@@ -38,7 +38,7 @@ table(table table-bordered table-condensed).
  |is_trashed|datetime|True if @trash_at@ is in the past, false if not.||
  |frozen_by_uuid|string|For a frozen project, indicates the user who froze the project; null in all other cases. When a project is frozen, no further changes can be made to the project or its contents, even by admins. Attempting to add new items or modify, rename, move, trash, or delete the project or its contents, including any subprojects, will return an error.||
  
-h3. Frozen projects
+h3(#frozen). Frozen projects
  
  A user with @manage@ permission can set the @frozen_by_uuid@ attribute of a @project@ group to their own user UUID. Once this is done, no further changes can be made to the project or its contents, including subprojects.
  
diff --git a/doc/api/projects.html.textile.liquid b/doc/api/projects.html.textile.liquid

index 9aa3d85d4d5297adfc91d396a9f8b518d9ff831e..5cb630c43454c24582cb540077051b3b7e847f43 100644 (file)
--- a/doc/api/projects.html.textile.liquid
+++ b/doc/api/projects.html.textile.liquid
@@ -27,7 +27,7 @@ In this command, `zzzzz-tpzed-123456789012345` is a @user@ uuid, which is unusua
  
  Because the home project is a virtual project, other operations via the @groups@ API are not supported.
  
-h2. Filter groups
+h2(#filtergroups). Filter groups
  
  Filter groups are another type of virtual project. They are implemented as an Arvados @group@ object with @group_class@ set to the value "filter".
  
diff --git a/doc/api/properties.html.textile.liquid b/doc/api/properties.html.textile.liquid

new file mode 100644 (file)

index 0000000..bf4b05c
--- /dev/null
+++ b/doc/api/properties.html.textile.liquid
@@ -0,0 +1,50 @@
+---
+layout: default
+navsection: api
+title: "Metadata properties"
+...
+{% comment %}
+Copyright (C) The Arvados Authors. All rights reserved.
+
+SPDX-License-Identifier: CC-BY-SA-3.0
+{% endcomment %}
+
+Arvados allows you to attach arbitrary properties to "collection":methods/collections.html, "container_request":methods/container_requests.html, "link":methods/links.html and "group":methods/groups.html records that have a @properties@ field.  These are key-value pairs, where the value is a valid JSON type (string, number, null, boolean, array, object).
+
+Searching for records using properties is described in "Filtering on subproperties":methods.html#subpropertyfilters .
+
+h2. Reserved properties
+
+The following properties are set by Arvados components.
+
+table(table table-bordered table-condensed).
+|_. Property name|_. Appears on|_. Value type|_.Description|
+|type|collection|string|Appears on collections to indicate the contents or usage. See "Collection type values":#collectiontype below for details.|
+|container_request|collection|string|The UUID of the container request that produced an output or log collection.|
+|docker-image-repo-tag|collection|string|For collections containing a Docker image, the repo/name:tag identifier|
+|container_uuid|collection|string|The UUID of the container that produced a collection (set on collections with type=log)|
+|cwl_input|container_request|object|On an intermediate container request, the CWL workflow-level input parameters used to generate the container request|
+|cwl_output|container_request|object|On an intermediate container request, the CWL workflow-level output parameters collected from the container request|
+|template_uuid|container_request|string|For a workflow runner container request, the workflow record that was used to launch it.|
+|username|link|string|For a "can_login":permission-model.html#links permission link, the unix username on the VM that the user will have.|
+|groups|link|array of string|For a "can_login":permission-model.html#links permission link, the unix groups on the VM that the user will be added to.|
+|image_timestamp|link|string|When resolving a Docker image name and multiple links are found with @link_class=docker_image_repo+tag@ and same @link_name@, the @image_timestamp@ is used to determine precedence (most recent wins).|
+|filters|group|array of array of string|Used to define "filter groups":projects.html#filtergroups|
+
+h3(#collectiontype). Collection "type" values
+
+Meaningful values of the @type@ property.  These are recognized by Workbench when filtering on types of collections from the project content listing.
+
+table(table table-bordered table-condensed).
+|_. Type|_.Description|
+|log|The collection contains log files from a container run.|
+|output|The collection contains the output of a top-level container run (this is a container request where @requesting_container_uuid@  is null).|
+|intermediate|The collection contains the output of a child container run (this is a container request where @requesting_container_uuid@ is non-empty).|
+
+h2. Controlling user-supplied properties
+
+Arvados can be configured with a vocabulary file that lists valid properties and the range of valid values for those properties.  This is described in "Metadata vocabulary":{{site.baseurl}}/admin/metadata-vocabulary.html .
+
+Arvados offers options to set properties automatically and/or prevent certain properties, once set, from being changed by non-admin users.  This is described in "Configuring collection's managed properties":{{site.baseurl}}/admin/collection-managed-properties.html .
+
+The admin can require that certain properties must be non-empty before "freezing a project":methods/groups.html#frozen .
diff --git a/doc/architecture/federation.html.textile.liquid b/doc/architecture/federation.html.textile.liquid

index 1ae8b6006405af727a4d4d22c4ffc99accfd53fa..698e355da626a561448b9ef2814025ded1054620 100644 (file)
--- a/doc/architecture/federation.html.textile.liquid
+++ b/doc/architecture/federation.html.textile.liquid
@@ -36,14 +36,14 @@ Clusters:
    clsr1:
      RemoteClusters:
        clsr2:
-        Host: api.cluster2.com
+        Host: api.cluster2.example
          Proxy: true
        clsr3:
-        Host: api.cluster3.com
+        Host: api.cluster3.example
          Proxy: true
  </pre>
  
-In this example, the cluster @clsr1@ is configured to contact @api.cluster2.com@ for requests involving @clsr2@ and @api.cluster3.com@ for requests involving @clsr3@.
+In this example, the cluster @clsr1@ is configured to contact @api.cluster2.example@ for requests involving @clsr2@ and @api.cluster3.example@ for requests involving @clsr3@.
  
  h2(#identity). Identity
  
diff --git a/doc/install/configure-s3-object-storage.html.textile.liquid b/doc/install/configure-s3-object-storage.html.textile.liquid

index 288a9a48291ff92ca2ad2320348d4474bec300e6..b4e0c1a312fd1b1feb3d0bf27fa9a05b0bc416dc 100644 (file)
--- a/doc/install/configure-s3-object-storage.html.textile.liquid
+++ b/doc/install/configure-s3-object-storage.html.textile.liquid
@@ -51,8 +51,9 @@ h2(#example). Configuration example
            AccessKeyID: <span class="userinput">""</span>
            SecretAccessKey: <span class="userinput">""</span>
  
-          # Storage provider region. For Google Cloud Storage, use ""
-          # or omit.
+          # Storage provider region. If Endpoint is specified, the
+          # region determines the request signing method, and defaults
+          # to "us-east-1".
            Region: <span class="userinput">us-east-1</span>
  
            # Storage provider endpoint. For Amazon S3, use "" or
diff --git a/doc/install/crunch2-cloud/install-dispatch-cloud.html.textile.liquid b/doc/install/crunch2-cloud/install-dispatch-cloud.html.textile.liquid

index 4f872911b481fa2d0be96281933edc70033bdab6..198925c7bda33a77352304ee124ab9875ff0f182 100644 (file)
--- a/doc/install/crunch2-cloud/install-dispatch-cloud.html.textile.liquid
+++ b/doc/install/crunch2-cloud/install-dispatch-cloud.html.textile.liquid
@@ -380,39 +380,27 @@ h2(#confirm-working). Confirm working installation
  On the dispatch node, start monitoring the arvados-dispatch-cloud logs:
  
  <notextile>
-<pre><code>~$ <span class="userinput">sudo journalctl -o cat -fu arvados-dispatch-cloud.service</span>
+<pre><code># <span class="userinput">journalctl -o cat -fu arvados-dispatch-cloud.service</span>
  </code></pre>
  </notextile>
  
-"Make sure to install the arvados/jobs image.":../install-jobs-image.html
-
-Submit a simple container request:
+In another terminal window, use the diagnostics tool to run a simple container.
  
  <notextile>
-<pre><code>shell:~$ <span class="userinput">arv container_request create --container-request '{
-  "name":            "test",
-  "state":           "Committed",
-  "priority":        1,
-  "container_image": "arvados/jobs:latest",
-  "command":         ["echo", "Hello, Crunch!"],
-  "output_path":     "/out",
-  "mounts": {
-    "/out": {
-      "kind":        "tmp",
-      "capacity":    1000
-    }
-  },
-  "runtime_constraints": {
-    "vcpus": 1,
-    "ram": 1048576
-  }
-}'</span>
+<pre><code># <span class="userinput">arvados-client sudo diagnostics</span>
+INFO       5: running health check (same as `arvados-server check`)
+INFO      10: getting discovery document from https://zzzzz.arvadosapi.com/discovery/v1/apis/arvados/v1/rest
+...
+INFO     160: running a container
+INFO      ... container request submitted, waiting up to 10m for container to run
  </code></pre>
  </notextile>
  
-This command should return a record with a @container_uuid@ field.  Once @arvados-dispatch-cloud@ polls the API server for new containers to run, you should see it dispatch that same container.
+After performing a number of other quick tests, this will submit a new container request and wait for it to finish.
+
+While the diagnostics tool is waiting, the @arvados-dispatch-cloud@ logs will show details about creating a cloud instance, waiting for it to be ready, and scheduling the new container on it.
  
-The @arvados-dispatch-cloud@ API provides a list of queued and running jobs and cloud instances. Use your @ManagementToken@ to test the dispatcher's endpoint. For example, when one container is running:
+You can also use the "arvados-dispatch-cloud API":{{site.baseurl}}/api/dispatch.html to get a list of queued and running jobs and cloud instances. Use your @ManagementToken@ to test the dispatcher's endpoint. For example, when one container is running:
  
  <notextile>
  <pre><code>~$ <span class="userinput">curl -sH "Authorization: Bearer $token" http://localhost:9006/arvados/v1/dispatch/containers</span>
@@ -452,8 +440,6 @@ The @arvados-dispatch-cloud@ API provides a list of queued and running jobs and
  
  A similar request can be made to the @http://localhost:9006/arvados/v1/dispatch/instances@ endpoint.
  
-When the container finishes, the dispatcher will log it.
-
  After the container finishes, you can get the container record by UUID *from a shell server* to see its results:
  
  <notextile>
diff --git a/doc/install/crunch2-lsf/install-dispatch.html.textile.liquid b/doc/install/crunch2-lsf/install-dispatch.html.textile.liquid

index 37adffd18d4e9bef5162614b015a3155df3333a5..d4328d89a3f55b98d909108329bc9f0782ec7718 100644 (file)
--- a/doc/install/crunch2-lsf/install-dispatch.html.textile.liquid
+++ b/doc/install/crunch2-lsf/install-dispatch.html.textile.liquid
@@ -62,7 +62,7 @@ Alternatively, you can arrange for the arvados-dispatch-lsf process to run as an
  </notextile>
  
  
-h3(#SbatchArguments). Containers.LSF.BsubArgumentsList
+h3(#BsubArgumentsList). Containers.LSF.BsubArgumentsList
  
  When arvados-dispatch-lsf invokes @bsub@, you can add arguments to the command by specifying @BsubArgumentsList@.  You can use this to send the jobs to specific cluster partitions or add resource requests.  Set @BsubArgumentsList@ to an array of strings.
  
@@ -87,7 +87,7 @@ For example:
  
  Note that the default value for @BsubArgumentsList@ uses the @-o@ and @-e@ arguments to write stdout/stderr data to files in @/tmp@ on the compute nodes, which is helpful for troubleshooting installation/configuration problems. Ensure you have something in place to delete old files from @/tmp@, or adjust these arguments accordingly.
  
-h3(#SbatchArguments). Containers.LSF.BsubCUDAArguments
+h3(#BsubCUDAArguments). Containers.LSF.BsubCUDAArguments
  
  If the container requests access to GPUs (@runtime_constraints.cuda.device_count@ of the container request is greater than zero), the command line arguments in @BsubCUDAArguments@ will be added to the command line _after_ @BsubArgumentsList@.  This should consist of the additional @bsub@ flags your site requires to schedule the job on a node with GPU support.  Set @BsubCUDAArguments@ to an array of strings.  For example:
  
@@ -98,7 +98,7 @@ If the container requests access to GPUs (@runtime_constraints.cuda.device_count
  </pre>
  </notextile>
  
-h3(#PollPeriod). Containers.PollInterval
+h3(#PollInterval). Containers.PollInterval
  
  arvados-dispatch-lsf polls the API server periodically for new containers to run.  The @PollInterval@ option controls how often this poll happens.  Set this to a string of numbers suffixed with one of the time units @s@, @m@, or @h@.  For example:
  
@@ -122,7 +122,7 @@ Supports suffixes @KB@, @KiB@, @MB@, @MiB@, @GB@, @GiB@, @TB@, @TiB@, @PB@, @PiB
  </notextile>
  
  
-h3(#CrunchRunCommand-network). Containers.CrunchRunArgumentList: Using host networking for containers
+h3(#CrunchRunArgumentList). Containers.CrunchRunArgumentList: Using host networking for containers
  
  Older Linux kernels (prior to 3.18) have bugs in network namespace handling which can lead to compute node lockups.  This by is indicated by blocked kernel tasks in "Workqueue: netns cleanup_net".   If you are experiencing this problem, as a workaround you can disable use of network namespaces by Docker across the cluster.  Be aware this reduces container isolation, which may be a security risk.
  
@@ -134,6 +134,37 @@ Older Linux kernels (prior to 3.18) have bugs in network namespace handling whic
  </pre>
  </notextile>
  
+
+h3(#InstanceTypes). InstanceTypes: Avoid submitting jobs with unsatisfiable resource constraints
+
+LSF does not provide feedback when a submitted job's RAM, CPU, or disk space constraints cannot be satisfied by any node: the job will wait in the queue indefinitely with "pending" status, reported by Arvados as "queued".
+
+As a workaround, you can configure @InstanceTypes@ with your LSF cluster's compute node sizes. Arvados will use these sizes to determine when a container is impossible to run, and cancel it instead of submitting an LSF job.
+
+Apart from detecting non-runnable containers, the configured instance types will not have any effect on scheduling.
+
+<notextile>
+<pre>    InstanceTypes:
+      most-ram:
+        VCPUs: 8
+        RAM: 640GiB
+        IncludedScratch: 640GB
+      most-cpus:
+        VCPUs: 32
+        RAM: 256GiB
+        IncludedScratch: 640GB
+      gpu:
+        VCPUs: 8
+        RAM: 256GiB
+        IncludedScratch: 640GB
+        CUDA:
+          DriverVersion: "11.4"
+          HardwareCapability: "7.5"
+          DeviceCount: 1
+</pre>
+</notextile>
+
+
  {% assign arvados_component = 'arvados-dispatch-lsf' %}
  
  {% include 'install_packages' %}
@@ -141,3 +172,28 @@ Older Linux kernels (prior to 3.18) have bugs in network namespace handling whic
  {% include 'start_service' %}
  
  {% include 'restart_api' %}
+
+h2(#confirm-working). Confirm working installation
+
+On the dispatch node, start monitoring the arvados-dispatch-lsf logs:
+
+<notextile>
+<pre><code># <span class="userinput">journalctl -o cat -fu arvados-dispatch-lsf.service</span>
+</code></pre>
+</notextile>
+
+In another terminal window, use the diagnostics tool to run a simple container.
+
+<notextile>
+<pre><code># <span class="userinput">arvados-client sudo diagnostics</span>
+INFO       5: running health check (same as `arvados-server check`)
+INFO      10: getting discovery document from https://zzzzz.arvadosapi.com/discovery/v1/apis/arvados/v1/rest
+...
+INFO     160: running a container
+INFO      ... container request submitted, waiting up to 10m for container to run
+</code></pre>
+</notextile>
+
+After performing a number of other quick tests, this will submit a new container request and wait for it to finish.
+
+While the diagnostics tool is waiting, the @arvados-dispatch-lsf@ logs will show details about submitting an LSF job to run the container.
diff --git a/doc/install/crunch2-slurm/install-test.html.textile.liquid b/doc/install/crunch2-slurm/install-test.html.textile.liquid

index dc13c3c0f503db2c4a5a6df7a7998364d4e99c8e..ffd75a779378b61aefc6ab4c949d7a5129ab0f12 100644 (file)
--- a/doc/install/crunch2-slurm/install-test.html.textile.liquid
+++ b/doc/install/crunch2-slurm/install-test.html.textile.liquid
@@ -31,35 +31,23 @@ Make sure all of your compute nodes are set up with "Docker":../crunch2/install-
  On the dispatch node, start monitoring the crunch-dispatch-slurm logs:
  
  <notextile>
-<pre><code>~$ <span class="userinput">sudo journalctl -o cat -fu crunch-dispatch-slurm.service</span>
+<pre><code># <span class="userinput">journalctl -o cat -fu crunch-dispatch-slurm.service</span>
  </code></pre>
  </notextile>
  
-Submit a simple container request:
+In another terminal window, use the diagnostics tool to run a simple container.
  
  <notextile>
-<pre><code>shell:~$ <span class="userinput">arv container_request create --container-request '{
-  "name":            "test",
-  "state":           "Committed",
-  "priority":        1,
-  "container_image": "arvados/jobs:latest",
-  "command":         ["echo", "Hello, Crunch!"],
-  "output_path":     "/out",
-  "mounts": {
-    "/out": {
-      "kind":        "tmp",
-      "capacity":    1000
-    }
-  },
-  "runtime_constraints": {
-    "vcpus": 1,
-    "ram": 8388608
-  }
-}'</span>
+<pre><code># <span class="userinput">arvados-client sudo diagnostics</span>
+INFO       5: running health check (same as `arvados-server check`)
+INFO      10: getting discovery document from https://zzzzz.arvadosapi.com/discovery/v1/apis/arvados/v1/rest
+...
+INFO     160: running a container
+INFO      ... container request submitted, waiting up to 10m for container to run
  </code></pre>
  </notextile>
  
-This command should return a record with a @container_uuid@ field.  Once @crunch-dispatch-slurm@ polls the API server for new containers to run, you should see it dispatch that same container.  It will log messages like:
+Once @crunch-dispatch-slurm@ polls the API server for new containers to run, you should see it dispatch the new container.  It will log messages like:
  
  <notextile>
  <pre><code>2016/08/05 13:52:54 Monitoring container zzzzz-dz642-hdp2vpu9nq14tx0 started
diff --git a/doc/install/install-shell-server.html.textile.liquid b/doc/install/install-shell-server.html.textile.liquid

index bdf9f4b59a63188f4f94ecb17d363ce393833c59..57b79d2042311805b1b7ea909e17d2e6e7e8fcc4 100644 (file)
--- a/doc/install/install-shell-server.html.textile.liquid
+++ b/doc/install/install-shell-server.html.textile.liquid
@@ -23,13 +23,13 @@ Arvados support for shell nodes allows you to use Arvados permissions to grant L
  
  A shell node runs the @arvados-login-sync@ service to manage user accounts, and typically has Arvados utilities and SDKs pre-installed.  Users are allowed to log in and run arbitrary programs.  For optimal performance, the Arvados shell server should be on the same LAN as the Arvados cluster.
  
-Because Arvados @config.yml@ _contains secrets_ it should not *not* be present on shell nodes.
+Because Arvados @config.yml@ _contains secrets_ it should *not* be present on shell nodes.
  
  Shell nodes should be separate virtual machines from the VMs running other Arvados services.  You may choose to grant root access to users so that they can customize the node, for example, installing new programs.  This has security considerations depending on whether a shell node is single-user or multi-user.
  
  A single-user shell node should be set up so that it only stores Arvados access tokens that belong to that user.  In that case, that user can be safely granted root access without compromising other Arvados users.
  
-In the multi-user shell node case, a malicious user with @root@ access could access other user's Arvados tokens.  Users should only be given @root@ access on a multi-user shell node if you would trust them them to be Arvados administrators.  Be aware that with access to the @docker@ daemon, it is trival to gain *root* access to any file on the system, so giving users @docker@ access should be considered equivalent to @root@ access.
+In the multi-user shell node case, a malicious user with @root@ access could access other users' Arvados tokens.  Users should only be given @root@ access on a multi-user shell node if you would trust them to be Arvados administrators.  Be aware that with access to the @docker@ daemon, it is trivial to gain *root* access to any file on the system, so giving users @docker@ access should be considered equivalent to @root@ access.
  
  h2(#dependencies). Install Dependencies and SDKs
  
@@ -101,17 +101,15 @@ EOF</span></code>
  </pre>
  </notextile>
  
-h3. Part of a LoginCLuster federation
+h3. Part of a LoginCluster federation
  
-If this cluster is part of a "federation with centralized user management":../admin/federation.html#LoginCluster , the login sync script also needs to be given the host and user token for the login cluster.
+If the cluster is part of a "federation with centralized user management":../admin/federation.html#LoginCluster , the login sync script needs to be given an admin token from the login cluster.
  
  <notextile>
  <pre>
  <code>shellserver:# <span class="userinput">umask 0700; tee /etc/cron.d/arvados-login-sync &lt;&lt;EOF
  ARVADOS_API_HOST="<strong>ClusterID.example.com</strong>"
-ARVADOS_API_TOKEN="<strong>xxxxxxxxxxxxxxxxx</strong>"
-LOGINCLUSTER_ARVADOS_API_HOST="<strong>LoginClusterID.example.com</strong>"
-LOGINCLUSTER_ARVADOS_API_TOKEN="<strong>yyyyyyyyyyyyyyyyy</strong>"
+ARVADOS_API_TOKEN="<strong>yyyloginclusteradmintokenyyyy</strong>"
  ARVADOS_VIRTUAL_MACHINE_UUID="<strong>zzzzz-2x53u-zzzzzzzzzzzzzzz</strong>"
  */2 * * * * root arvados-login-sync
  EOF</span></code>
diff --git a/doc/sdk/index.html.textile.liquid b/doc/sdk/index.html.textile.liquid

index 0bfe7ea72aa2a94380aad4c9b7180c2ecbf35aed..b733d03bfc37d5152afdb3a3d515a9e66e4e4d23 100644 (file)
--- a/doc/sdk/index.html.textile.liquid
+++ b/doc/sdk/index.html.textile.liquid
@@ -17,6 +17,5 @@ This section documents language bindings for the "Arvados API":{{site.baseurl}}/
  * "R SDK":{{site.baseurl}}/sdk/R/index.html
  * "Ruby SDK":{{site.baseurl}}/sdk/ruby/index.html
  * "Java SDK v2":{{site.baseurl}}/sdk/java-v2/index.html
-* "Perl SDK":{{site.baseurl}}/sdk/perl/index.html
  
  Many Arvados Workbench pages, under the *Advanced* tab, provide examples of API and SDK use for accessing the current resource .
diff --git a/doc/sdk/perl/example.html.textile.liquid b/doc/sdk/perl/example.html.textile.liquid

deleted file mode 100644 (file)

index b51cfe4..0000000
--- a/doc/sdk/perl/example.html.textile.liquid
+++ /dev/null
@@ -1,77 +0,0 @@
----
-layout: default
-navsection: sdk
-navmenu: Perl
-title: "Examples"
-...
-{% comment %}
-Copyright (C) The Arvados Authors. All rights reserved.
-
-SPDX-License-Identifier: CC-BY-SA-3.0
-{% endcomment %}
-
-h2. Initialize SDK
-
-Set up an API client user agent:
-
-{% codeblock as perl %}
-use Arvados;
-my $arv = Arvados->new('apiVersion' => 'v1');
-{% endcodeblock %}
-
-The SDK retrieves the list of API methods from the server at run time. Therefore, the set of available methods is determined by the server version rather than the SDK version.
-
-h2. create
-
-Create an object:
-
-{% codeblock as perl %}
-my $test_link = $arv->{'links'}->{'create'}->execute('link' => { 'link_class' => 'test', 'name' => 'test' });
-{% endcodeblock %}
-
-h2. delete
-
-{% codeblock as perl %}
-my $some_user = $arv->{'collections'}->{'get'}->execute('uuid' => $collection_uuid);
-{% endcodeblock %}
-
-h2. get
-
-Retrieve an object by ID:
-
-{% codeblock as perl %}
-my $some_user = $arv->{'users'}->{'get'}->execute('uuid' => $current_user_uuid);
-{% endcodeblock %}
-
-Get the UUID of an object that was retrieved using the SDK:
-
-{% codeblock as perl %}
-my $current_user_uuid = $current_user->{'uuid'}
-{% endcodeblock %}
-
-h2. list
-
-Get a list of objects:
-
-{% codeblock as perl %}
-my $repos = $arv->{'repositories'}->{'list'}->execute;
-print ("UUID of first repo returned is ", $repos->{'items'}->[0], "\n");
-{% endcodeblock %}
-
-h2. update
-
-Update an object:
-
-{% codeblock as perl %}
-my $test_link = $arv->{'links'}->{'update'}->execute(
-        'uuid' => $test_link->{'uuid'},
-        'link' => { 'properties' => { 'foo' => 'bar' } });
-{% endcodeblock %}
-
-h2. Get current user
-
-Get the User object for the current user:
-
-{% codeblock as perl %}
-my $current_user = $arv->{'users'}->{'current'}->execute;
-{% endcodeblock %}
diff --git a/doc/sdk/perl/index.html.textile.liquid b/doc/sdk/perl/index.html.textile.liquid

deleted file mode 100644 (file)

index ba01352..0000000
--- a/doc/sdk/perl/index.html.textile.liquid
+++ /dev/null
@@ -1,66 +0,0 @@
----
-layout: default
-navsection: sdk
-navmenu: Perl
-title: "Installation"
-...
-{% comment %}
-Copyright (C) The Arvados Authors. All rights reserved.
-
-SPDX-License-Identifier: CC-BY-SA-3.0
-{% endcomment %}
-
-The Perl SDK provides a generic set of wrappers so you can make API calls easily.
-
-This is a legacy SDK.  It is no longer used or maintained regularly.
-
-h3. Installation
-
-h4. Option 1: Install from distribution packages
-
-First, "add the appropriate package repository for your distribution":{{ site.baseurl }}/install/install-manual-prerequisites.html#repos.
-
-On Debian-based systems:
-
-<notextile>
-<pre><code>~$ <span class="userinput">sudo apt-get install libjson-perl libio-socket-ssl-perl libwww-perl libipc-system-simple-perl libarvados-perl</code>
-</code></pre>
-</notextile>
-
-On Red Hat-based systems:
-
-<notextile>
-<pre><code>~$ <span class="userinput">sudo yum install perl-ExtUtils-MakeMaker perl-JSON perl-IO-Socket-SSL perl-Crypt-SSLeay perl-WWW-Curl libarvados-perl</code>
-</code></pre>
-</notextile>
-
-h4. Option 2: Install from source
-
-First, install dependencies from your distribution.  Refer to the package lists above, but don't install @libarvados-perl@.
-
-Then run the following:
-
-<notextile>
-<pre><code>~$ <span class="userinput">git clone https://github.com/arvados/arvados.git</span>
-~$ <span class="userinput">cd arvados/sdk/perl</span>
-~$ <span class="userinput">perl Makefile.PL</span>
-~$ <span class="userinput">sudo make install</span>
-</code></pre>
-</notextile>
-
-h3. Test installation
-
-If the SDK is installed, @perl -MArvados -e ''@ should produce no errors.
-
-If your @ARVADOS_API_HOST@ and @ARVADOS_API_TOKEN@ environment variables are set up correctly (see "api-tokens":{{site.baseurl}}/user/reference/api-tokens.html for details), the following test script should work:
-
-<notextile>
-<pre>~$ <code class="userinput">perl &lt;&lt;'EOF'
-use Arvados;
-my $arv = Arvados-&gt;new('apiVersion' => 'v1');
-my $me = $arv-&gt;{'users'}-&gt;{'current'}-&gt;execute;
-print ("arvados.v1.users.current.full_name = '", $me-&gt;{'full_name'}, "'\n");
-EOF</code>
-arvados.v1.users.current.full_name = 'Your Name'
-</pre>
-</notextile>
diff --git a/doc/sdk/python/cookbook.html.textile.liquid b/doc/sdk/python/cookbook.html.textile.liquid

index f3186ebbb6d76d66221860f669960cb9737688eb..53330dcbebbaf762cd1a557200e2b204ad8774a6 100644 (file)
--- a/doc/sdk/python/cookbook.html.textile.liquid
+++ b/doc/sdk/python/cookbook.html.textile.liquid
@@ -10,14 +10,36 @@ Copyright (C) The Arvados Authors. All rights reserved.
  SPDX-License-Identifier: CC-BY-SA-3.0
  {% endcomment %}
  
-h2. Cancel a container request
+# "Cancel a container request":#cancel-a-container-request
+# "Cancel all container requests":#cancel-all-container-requests
+# "List completed container requests":#list-completed-container-requests
+# "Get input of a CWL workflow":#get-input-of-a-cwl-workflow
+# "Get output of a CWL workflow":#get-output-of-a-cwl-workflow
+# "Get state of a CWL workflow":#get-state-of-a-cwl-workflow
+# "List input of child requests":#list-input-of-child-requests
+# "List output of child requests":#list-output-of-child-requests
+# "List failed child requests":#list-failed-child-requests
+# "Get log of a child request":#get-log-of-a-child-request
+# "Create a collection sharing link":#sharing-link
+# "Combine two or more collections":#combine-two-or-more-collections
+# "Upload a file into a new collection":#upload-a-file-into-a-new-collection
+# "Download a file from a collection":#download-a-file-from-a-collection
+# "Copy files from a collection to a new collection":#copy-files-from-a-collection-to-a-new-collection
+# "Copy files from a collection to another collection":#copy-files-from-a-collection-to-another-collection
+# "Delete a file from an existing collection":#delete-a-file-from-an-existing-collection
+# "Listing records with paging":#listing-records-with-paging
+# "Querying the vocabulary definition":#querying-the-vocabulary-definition
+# "Translating between vocabulary identifiers and labels":#translating-between-vocabulary-identifiers-and-labels
+# "Create a Project":#create-a-project
+
+h2(#cancel-a-container-request). Cancel a container request
  
  {% codeblock as python %}
  import arvados
  arvados.api().container_requests().update(uuid=container_request_uuid, body={"priority": 0}).execute()
  {% endcodeblock %}
  
-h2. Cancel all container requests
+h2(#cancel-all-container-requests). Cancel all container requests
  
  {% codeblock as python %}
  import arvados
@@ -27,7 +49,7 @@ for container_request in result:
      api.container_requests().update(uuid=container_request["uuid"], body={"priority": 0}).execute()
  {% endcodeblock %}
  
-h2. List completed container requests
+h2(#list-completed-container-requests). List completed container requests
  
  {% codeblock as python %}
  import arvados
@@ -42,7 +64,7 @@ for container_request in result:
      print("%s, %s, %s" % (container_request["uuid"], container_request["name"], "Success" if container["exit_code"] == 0 else "Failed"))
  {% endcodeblock %}
  
-h2. Get input of a CWL workflow
+h2(#get-input-of-a-cwl-workflow). Get input of a CWL workflow
  
  {% codeblock as python %}
  import arvados
@@ -52,7 +74,7 @@ container_request = api.container_requests().get(uuid=container_request_uuid).ex
  print(container_request["mounts"]["/var/lib/cwl/cwl.input.json"])
  {% endcodeblock %}
  
-h2. Get output of a CWL workflow
+h2(#get-output-of-a-cwl-workflow). Get output of a CWL workflow
  
  {% codeblock as python %}
  import arvados
@@ -64,7 +86,7 @@ collection = arvados.collection.CollectionReader(container_request["output_uuid"
  print(collection.open("cwl.output.json").read())
  {% endcodeblock %}
  
-h2. Get state of a CWL workflow
+h2(#get-state-of-a-cwl-workflow). Get state of a CWL workflow
  
  {% codeblock as python %}
  import arvados
@@ -93,7 +115,7 @@ container_request_uuid = 'zzzzz-xvhdp-zzzzzzzzzzzzzzz'
  print(get_cr_state(container_request_uuid))
  {% endcodeblock %}
  
-h2. List input of child requests
+h2(#list-input-of-child-requests). List input of child requests
  
  {% codeblock as python %}
  import arvados
@@ -112,7 +134,7 @@ for c in child_requests["items"]:
              print("  %s" % m["portable_data_hash"])
  {% endcodeblock %}
  
-h2. List output of child requests
+h2(#list-output-of-child-requests). List output of child requests
  
  {% codeblock as python %}
  import arvados
@@ -131,7 +153,7 @@ for c in child_requests["items"]:
      print("%s -> %s" % (c["name"], uuid_to_pdh[c["output_uuid"]]))
  {% endcodeblock %}
  
-h2. List failed child requests
+h2(#list-failed-child-requests). List failed child requests
  
  {% codeblock as python %}
  import arvados
@@ -149,7 +171,7 @@ for c in cancelled_child_containers["items"]:
      print("%s (%s)" % (child_containers[c["uuid"]]["name"], child_containers[c["uuid"]]["uuid"]))
  {% endcodeblock %}
  
-h2. Get log of a child request
+h2(#get-log-of-a-child-request). Get log of a child request
  
  {% codeblock as python %}
  import arvados
@@ -177,7 +199,7 @@ token = api.api_client_authorizations().create(body={"api_client_authorization":
  print("%s/c=%s/t=%s/_/" % (download, collection_uuid, token["api_token"]))
  {% endcodeblock %}
  
-h2. Combine two or more collections
+h2(#combine-two-or-more-collections). Combine two or more collections
  
  Note, if two collections have files of the same name, the contents will be concatenated in the resulting manifest.
  
@@ -185,7 +207,7 @@ Note, if two collections have files of the same name, the contents will be conca
  import arvados
  import arvados.collection
  api = arvados.api()
-project_uuid = "zzzzz-tpzed-zzzzzzzzzzzzzzz"
+project_uuid = "zzzzz-j7d0g-zzzzzzzzzzzzzzz"
  collection_uuids = ["zzzzz-4zz18-aaaaaaaaaaaaaaa", "zzzzz-4zz18-bbbbbbbbbbbbbbb"]
  combined_manifest = ""
  for u in collection_uuids:
@@ -195,7 +217,7 @@ newcol = arvados.collection.Collection(combined_manifest)
  newcol.save_new(name="My combined collection", owner_uuid=project_uuid)
  {% endcodeblock %}
  
-h2. Upload a file into a new collection
+h2(#upload-a-file-into-a-new-collection). Upload a file into a new collection
  
  {% codeblock as python %}
  import arvados
@@ -217,7 +239,7 @@ c.save_new(name=collection_name, owner_uuid=project_uuid)
  print("Saved %s to %s" % (collection_name, c.manifest_locator()))
  {% endcodeblock %}
  
-h2. Download a file from a collection
+h2(#download-a-file-from-a-collection). Download a file from a collection
  
  {% codeblock as python %}
  import arvados
@@ -237,7 +259,7 @@ with c.open(filename, "rb") as reader:
  print("Finished downloading %s" % filename)
  {% endcodeblock %}
  
-h2. Copy files from a collection to a new collection
+h2(#copy-files-from-a-collection-to-a-new-collection). Copy files from a collection to a new collection
  
  {% codeblock as python %}
  import arvados.collection
@@ -258,7 +280,7 @@ target.save_new(name=target_name, owner_uuid=target_project)
  print("Created collection %s" % target.manifest_locator())
  {% endcodeblock %}
  
-h2. Copy files from a collection to another collection
+h2(#copy-files-from-a-collection-to-another-collection). Copy files from a collection to another collection
  
  {% codeblock as python %}
  import arvados.collection
@@ -277,7 +299,7 @@ for f in files_to_copy:
  target.save()
  {% endcodeblock %}
  
-h2. Delete a file from an existing collection
+h2(#delete-a-file-from-an-existing-collection). Delete a file from an existing collection
  
  {% codeblock as python %}
  import arvados
@@ -287,7 +309,7 @@ c.remove("file2.txt")
  c.save()
  {% endcodeblock %}
  
-h2. Listing records with paging
+h2(#listing-records-with-paging). Listing records with paging
  
  Use the @arvados.util.keyset_list_all@ helper method to iterate over all the records matching an optional filter.  This method handles paging internally and returns results incrementally using a Python iterator.  The first parameter of the method takes a @list@ method of an Arvados resource (@collections@, @container_requests@, etc).
  
@@ -299,7 +321,7 @@ for c in arvados.util.keyset_list_all(api.collections().list, filters=[["name",
      print("got collection " + c["uuid"])
  {% endcodeblock %}
  
-h2. Querying the vocabulary definition
+h2(#querying-the-vocabulary-definition). Querying the vocabulary definition
  
  The Python SDK provides facilities to interact with the "active metadata vocabulary":{{ site.baseurl }}/admin/metadata-vocabulary.html in the system. The developer can do key and value lookups in a case-insensitive manner:
  
@@ -319,7 +341,7 @@ voc['size']['Small'].identifier
  # Example output: 'IDVALSIZES2'
  {% endcodeblock %}
  
-h2. Translating between vocabulary identifiers and labels
+h2(#translating-between-vocabulary-identifiers-and-labels). Translating between vocabulary identifiers and labels
  
  Client software might need to present properties to the user in a human-readable form or take input from the user without requiring them to remember identifiers. For these cases, there're a couple of conversion methods that take a dictionary as input like this:
  
@@ -331,4 +353,22 @@ voc.convert_to_labels({'IDTAGIMPORTANCES': 'IDVALIMPORTANCES1'})
  # Example output: {'Importance': 'Critical'}
  voc.convert_to_identifiers({'creature': 'elephant'})
  # Example output: {'IDTAGANIMALS': 'IDVALANIMALS3'}
-{% endcodeblock %}
-\ No newline at end of file
+{% endcodeblock %}
+
+h2(#create-a-project). Create a Project
+
+{% codeblock as python %}
+import arvados
+
+parent_project_uuid = "zzzzz-j7d0g-zzzzzzzzzzzzzzz"
+project_name = "My project"
+
+g = arvados.api().groups().create(body={
+  "group": {
+    "group_class": "project",
+    "owner_uuid": parent_project_uuid,
+    "name": project_name,
+  }}).execute()
+
+print("New project uuid is", g["uuid"])
+{% endcodeblock %}
diff --git a/doc/user/cwl/cwl-run-options.html.textile.liquid b/doc/user/cwl/cwl-run-options.html.textile.liquid

index 94e46ae1bc3487179dc1a72167d2d8bf94235085..703ec89139baf45afcafc8cf84c93b304ecee2b1 100644 (file)
--- a/doc/user/cwl/cwl-run-options.html.textile.liquid
+++ b/doc/user/cwl/cwl-run-options.html.textile.liquid
@@ -38,34 +38,40 @@ table(table table-bordered table-condensed).
  |==--output-name OUTPUT_NAME==|Name to use for collection that stores the final output.|
  |==--output-tags OUTPUT_TAGS==|Tags for the final output collection separated by commas, e.g., =='--output-tags tag0,tag1,tag2'==.|
  |==--ignore-docker-for-reuse==|Ignore Docker image version when deciding whether to reuse past containers.|
-|==--submit==|              Submit workflow runner to Arvados to manage the workflow (default).|
-|==--local==|               Run workflow on local host (still submits containers to Arvados).|
+|==--submit==|              Submit workflow to run on Arvados.|
+|==--local==|               Run workflow on local host (submits containers to Arvados).|
  |==--create-template==|     (Deprecated) synonym for --create-workflow.|
  |==--create-workflow==|     Register an Arvados workflow that can be run from Workbench|
-|==--update-workflow== UUID|Update an existing Arvados workflow or pipeline template with the given UUID.|
+|==--update-workflow== UUID|Update an existing Arvados workflow with the given UUID.|
  |==--wait==|                After submitting workflow runner, wait for completion.|
  |==--no-wait==|             Submit workflow runner and exit.|
  |==--log-timestamps==|      Prefix logging lines with timestamp|
  |==--no-log-timestamps==|   No timestamp on logging lines|
  |==--compute-checksum==|    Compute checksum of contents while collecting outputs|
-|==--submit-runner-ram== SUBMIT_RUNNER_RAM|RAM (in MiB) required for the workflow runner (default 1024)|
-|==--submit-runner-image== SUBMIT_RUNNER_IMAGE|Docker image for workflow runner|
+|==--submit-runner-ram== SUBMIT_RUNNER_RAM|RAM (in MiB) required for the workflow runner job (default 1024)|
+|==--submit-runner-image== SUBMIT_RUNNER_IMAGE|Docker image for workflow runner job|
  |==--always-submit-runner==|When invoked with --submit --wait, always submit a runner to manage the workflow, even when only running a single CommandLineTool|
  |==--match-submitter-images==|Where Arvados has more than one Docker image of the same name, use image from the Docker instance on the submitting node.|
  |==--submit-request-uuid== UUID|Update and commit to supplied container request instead of creating a new one.|
  |==--submit-runner-cluster== CLUSTER_ID|Submit workflow runner to a remote cluster|
-|==--name NAME==|Name to use for workflow execution instance.|
+|==--collection-cache-size== COLLECTION_CACHE_SIZE|Collection cache size (in MiB, default 256).|
+|==--name== NAME|Name to use for workflow execution instance.|
  |==--on-error== {stop,continue}|Desired workflow behavior when a step fails.  One of 'stop' (do not submit any more steps) or 'continue' (may submit other steps that are not downstream from the error). Default is 'continue'.|
-|==--enable-dev==|Enable loading and running development versions of CWL spec.|
-|==--storage-classes== STORAGE_CLASSES|Specify comma separated list of storage classes to be used when saving the final workflow output to Keep.|
-|==--intermediate-storage-classes== STORAGE_CLASSES|Specify comma separated list of storage classes to be used when intermediate workflow output to Keep.|
+|==--enable-dev==|Enable loading and running development versions of the CWL standards.|
+|==--storage-classes== STORAGE_CLASSES|Specify comma separated list of storage classes to be used when saving final workflow output to Keep.|
+|==--intermediate-storage-classes== INTERMEDIATE_STORAGE_CLASSES|Specify comma separated list of storage classes to be used when saving intermediate workflow output to Keep.|
  |==--intermediate-output-ttl== N|If N > 0, intermediate output collections will be trashed N seconds after creation. Default is 0 (don't trash).|
  |==--priority== PRIORITY|Workflow priority (range 1..1000, higher has precedence over lower)|
-|==--thread-count== THREAD_COUNT|Number of threads to use for container submit and output collection.|
+|==--thread-count== THREAD_COUNT|Number of threads to use for job submit and output collection.|
  |==--http-timeout== HTTP_TIMEOUT|API request timeout in seconds. Default is 300 seconds (5 minutes).|
-|==--enable-preemptible==|Use preemptible instances. Control individual steps with "arv:UsePreemptible":cwl-extensions.html#UsePreemptible hint.|
+|==--defer-downloads==|When submitting a workflow, defer downloading HTTP URLs to workflow launch instead of downloading to Keep before submit.|
+|==--varying-url-params== VARYING_URL_PARAMS|A comma separated list of URL query parameters that should be ignored when storing HTTP URLs in Keep.|
+|==--prefer-cached-downloads==|If a HTTP URL is found in Keep, skip upstream URL freshness check (will not notice if the upstream has changed, but also not error if upstream is unavailable).|
+|==--enable-preemptible==|Use preemptible instances. Control individual steps with arv:UsePreemptible hint.|
  |==--disable-preemptible==|Don't use preemptible instances.|
-|==--skip-schemas==|Skip loading of extension schemas (the $schemas section).|
+|==--copy-deps==|         Copy dependencies into the destination project.|
+|==--no-copy-deps==|      Leave dependencies where they are.|
+|==--skip-schemas==|      Skip loading of schemas|
  |==--trash-intermediate==|Immediately trash intermediate outputs on workflow success.|
  |==--no-trash-intermediate==|Do not trash intermediate outputs (default).|
  
diff --git a/doc/user/cwl/cwl-style.html.textile.liquid b/doc/user/cwl/cwl-style.html.textile.liquid

index 303ae37e9e94b98d5694cd8de5c71930ca6196ce..911c9ba5a539f1769178f6ca7984b34736aededa 100644 (file)
--- a/doc/user/cwl/cwl-style.html.textile.liquid
+++ b/doc/user/cwl/cwl-style.html.textile.liquid
@@ -172,7 +172,7 @@ Workflows should always provide @DockerRequirement@ in the @hints@ or @requireme
  
  h3. Build a reusable library of components
  
-Build a reusable library of components.  Share tool wrappers and subworkflows between projects.  Make use of and contribute to "community maintained workflows and tools":https://github.com/common-workflow-library and tool registries such as "Dockstore":http://dockstore.org .
+Share tool wrappers and subworkflows between projects.  Make use of and contribute to "community maintained workflows and tools":https://github.com/common-workflow-library and tool registries such as "Dockstore":http://dockstore.org .
  
  h3. Supply scripts as input parameters
  
@@ -208,7 +208,7 @@ h3. Getting the temporary and output directories
  
  You can get the designated temporary directory using @$(runtime.tmpdir)@ in your CWL file, or from the @$TMPDIR@ environment variable in your script.
  
-Similarly, you can get the designated output directory using $(runtime.outdir), or from the @HOME@ environment variable in your script.
+Similarly, you can get the designated output directory using @$(runtime.outdir)@, or from the @HOME@ environment variable in your script.
  
  h3. Specifying @ResourceRequirement@
  
@@ -234,3 +234,36 @@ steps:
          coresMin: 2
          tmpdirMin: 90000
  {% endcodeblock %}
+
+h3. Importing data into Keep
+
+You can use HTTP URLs as File input parameters and @arvados-cwl-runner@ will download them to Keep for you:
+
+{% codeblock as yaml %}
+fastq1:
+  class: File
+  location: https://example.com/genomes/sampleA_1.fastq
+fastq2:
+  class: File
+  location: https://example.com/genomes/sampleA_2.fastq
+{% endcodeblock %}
+
+Files are downloaded and stored in Keep collections with HTTP header information stored in metadata.  If a file was previously downloaded, @arvados-cwl-runner@ uses HTTP caching rules to decide if a file should be re-downloaded or not.
+
+The default behavior is to transfer the files on the client, prior to submitting the workflow run.  This guarantees the data is available when the workflow is submitted.  However, if data transfer is time consuming and you are submitting multiple workflow runs in a row, or the node submitting the workflow has limited bandwidth, you can use the @--defer-downloads@ option to have the data transfer performed by the workflow runner process on a compute node, after the workflow is submitted.
+
+@arvados-cwl-runner@ provides two additional options to control caching behavior.
+
+* @--varying-url-params@ will ignore the listed URL query parameters from any HTTP URLs when checking if a URL has already been downloaded to Keep.
+* @--prefer-cached-downloads@ will search Keep for the previously downloaded URL and use that if found, without checking the upstream resource. This means changes in the upstream resource won't be detected, but it also means the workflow will not fail if the upstream resource becomes inaccessible.
+
+One use of this is to import files from "AWS S3 signed URLs":https://docs.aws.amazon.com/AmazonS3/latest/userguide/ShareObjectPreSignedURL.html
+
+Here is an example usage.  The use of @--varying-url-params=AWSAccessKeyId,Signature,Expires@ is especially relevant: it removes these parameters from the cached URL, which means that if a new signed URL for the same object is generated later, it can be found in the cache.
+
+{% codeblock as sh %}
+arvados-cwl-runner --defer-downloads \
+                   --varying-url-params=AWSAccessKeyId,Signature,Expires \
+                  --prefer-cached-downloads \
+                  workflow.cwl params.yml
+{% endcodeblock %}
diff --git a/lib/config/config.default.yml b/lib/config/config.default.yml

index 444398bc3303d8ef3a1b50563933781649717b19..f7c2beca3372f294bb16762d6f5366e7e989a84c 100644 (file)
--- a/lib/config/config.default.yml
+++ b/lib/config/config.default.yml
@@ -373,6 +373,18 @@ Clusters:
        # cluster.
        RoleGroupsVisibleToAll: true
  
+      # During each period, a log entry with event_type="activity"
+      # will be recorded for each user who is active during that
+      # period. The object_uuid attribute will indicate the user's
+      # UUID.
+      #
+      # Multiple log entries for the same user may be generated during
+      # a period if there are multiple controller processes or a
+      # controller process is restarted.
+      #
+      # Use 0 to disable activity logging.
+      ActivityLoggingPeriod: 24h
+
      AuditLogs:
        # Time to keep audit logs, in seconds. (An audit log is a row added
        # to the "logs" table in the PostgreSQL database each time an
@@ -866,16 +878,28 @@ Clusters:
        # by going through login again.
        IssueTrustedTokens: true
  
-      # When the token is returned to a client, the token itself may
-      # be restricted from viewing/creating other tokens based on whether
-      # the client is "trusted" or not.  The local Workbench1 and
-      # Workbench2 are trusted by default, but if this is a
-      # LoginCluster, you probably want to include the other Workbench
-      # instances in the federation in this list.
+      # Origins (scheme://host[:port]) of clients trusted to receive
+      # new tokens via login process.  The ExternalURLs of the local
+      # Workbench1 and Workbench2 are trusted implicitly and do not
+      # need to be listed here.  If this is a LoginCluster, you
+      # probably want to include the other Workbench instances in the
+      # federation in this list.
+      #
+      # Example:
+      #
+      # TrustedClients:
+      #   "https://workbench.other-cluster.example": {}
+      #   "https://workbench2.other-cluster.example": {}
        TrustedClients:
-        SAMPLE:
-          "https://workbench.federate1.example": {}
-          "https://workbench.federate2.example": {}
+        SAMPLE: {}
+
+      # Treat any origin whose host part is "localhost" or a private
+      # IP address (e.g., http://10.0.0.123:3000/) as if it were
+      # listed in TrustedClients.
+      #
+      # Intended only for test/development use. Not appropriate for
+      # production use.
+      TrustPrivateNetworks: false
  
      Git:
        # Path to git or gitolite-shell executable. Each authenticated
@@ -941,8 +965,15 @@ Clusters:
        # troubleshooting purposes.
        LogReuseDecisions: false
  
-      # Default value for keep_cache_ram of a container's runtime_constraints.
-      DefaultKeepCacheRAM: 268435456
+      # Default value for keep_cache_ram of a container's
+      # runtime_constraints.  Note: this gets added to the RAM request
+      # used to allocate a VM or submit an HPC job.
+      DefaultKeepCacheRAM: 0
+
+      # Default value for keep_cache_disk of a container's
+      # runtime_constraints.  Note: this gets added to the disk
+      # request used to allocate a VM or submit an HPC job.
+      DefaultKeepCacheDisk: 8589934592
  
        # Number of times a container can be unlocked before being
        # automatically cancelled.
@@ -1004,7 +1035,7 @@ Clusters:
  
        # Extra RAM to reserve on the node, in addition to
        # the amount specified in the container's RuntimeConstraints
-      ReserveExtraRAM: 256MiB
+      ReserveExtraRAM: 550MiB
  
        # Minimum time between two attempts to run the same container
        MinRetryPeriod: 0s
@@ -1059,12 +1090,16 @@ Clusters:
        LocalKeepLogsToContainerLog: none
  
        Logging:
-        # When you run the db:delete_old_container_logs task, it will find
-        # containers that have been finished for at least this many seconds,
+        # Periodically (see SweepInterval) Arvados will check for
+        # containers that have been finished for at least this long,
          # and delete their stdout, stderr, arv-mount, crunch-run, and
          # crunchstat logs from the logs table.
          MaxAge: 720h
  
+        # How often to delete cached log entries for finished
+        # containers (see MaxAge).
+        SweepInterval: 12h
+
          # These two settings control how frequently log events are flushed to the
          # database.  Log lines are buffered until either crunch_log_bytes_per_event
          # has been reached or crunch_log_seconds_between_events has elapsed since
@@ -1483,7 +1518,7 @@ Clusters:
            RaceWindow: 24h
            PrefixLength: 0
            # Use aws-s3-go (v2) instead of goamz
-          UseAWSS3v2Driver: false
+          UseAWSS3v2Driver: true
  
            # For S3 driver, potentially unsafe tuning parameter,
            # intentionally excluded from main documentation.
@@ -1704,6 +1739,10 @@ Clusters:
        # This feature is disabled when set to zero.
        IdleTimeout: 0s
  
+      # URL to a file that is a fragment of text or HTML which should
+      # be rendered in Workbench as a banner.
+      BannerURL: ""
+
        # Workbench welcome screen, this is HTML text that will be
        # incorporated directly onto the page.
        WelcomePageHTML: |
diff --git a/lib/config/export.go b/lib/config/export.go

index a55295d1268b7cc0829ec2fe5073eb276c5b4564..814fc6cd9b9dfc6ab0fbea0d9e29715236a906bd 100644 (file)
--- a/lib/config/export.go
+++ b/lib/config/export.go
@@ -121,6 +121,7 @@ var whitelist = map[string]bool{
         "Containers.CrunchRunArgumentsList":        false,
         "Containers.CrunchRunCommand":              false,
         "Containers.DefaultKeepCacheRAM":           true,
+       "Containers.DefaultKeepCacheDisk":          true,
         "Containers.DispatchPrivateKey":            false,
         "Containers.JobsAPI":                       true,
         "Containers.JobsAPI.Enable":                true,
@@ -193,6 +194,7 @@ var whitelist = map[string]bool{
         "Login.Test.Users":                                    false,
         "Login.TokenLifetime":                                 false,
         "Login.TrustedClients":                                false,
+       "Login.TrustPrivateNetworks":                          false,
         "Mail":                                                true,
         "Mail.EmailFrom":                                      false,
         "Mail.IssueReporterEmailFrom":                         false,
@@ -226,6 +228,7 @@ var whitelist = map[string]bool{
         "TLS.Key":                                             false,
         "Users":                                               true,
         "Users.ActivatedUsersAreVisibleToOthers":              false,
+       "Users.ActivityLoggingPeriod":                         false,
         "Users.AdminNotifierEmailFrom":                        false,
         "Users.AnonymousUserToken":                            true,
         "Users.AutoAdminFirstUser":                            false,
@@ -263,6 +266,7 @@ var whitelist = map[string]bool{
         "Workbench.ApplicationMimetypesWithViewIcon.*":        true,
         "Workbench.ArvadosDocsite":                            true,
         "Workbench.ArvadosPublicDataDocURL":                   true,
+       "Workbench.BannerURL":                                 true,
         "Workbench.DefaultOpenIdPrefix":                       false,
         "Workbench.DisableSharingURLsUI":                      true,
         "Workbench.EnableGettingStartedPopup":                 true,
diff --git a/lib/controller/dblock/dblock.go b/lib/controller/dblock/dblock.go

index 1a36822d5b7f91e81c5b0deb167a105a962b3dfb..ad2733abfa36df82c72c4aa3c7a6c090c6496efb 100644 (file)
--- a/lib/controller/dblock/dblock.go
+++ b/lib/controller/dblock/dblock.go
@@ -7,6 +7,8 @@ package dblock
  import (
         "context"
         "database/sql"
+       "fmt"
+       "net"
         "sync"
         "time"
  
@@ -15,8 +17,12 @@ import (
  )
  
  var (
-       TrashSweep = &DBLocker{key: 10001}
-       retryDelay = 5 * time.Second
+       TrashSweep         = &DBLocker{key: 10001}
+       ContainerLogSweep  = &DBLocker{key: 10002}
+       KeepBalanceService = &DBLocker{key: 10003} // keep-balance service in periodic-sweep loop
+       KeepBalanceActive  = &DBLocker{key: 10004} // keep-balance sweep in progress (either -once=true or service loop)
+       Dispatch           = &DBLocker{key: 10005} // any dispatcher running
+       retryDelay         = 5 * time.Second
  )
  
  // DBLocker uses pg_advisory_lock to maintain a cluster-wide lock for
@@ -30,8 +36,11 @@ type DBLocker struct {
  }
  
  // Lock acquires the advisory lock, waiting/reconnecting if needed.
-func (dbl *DBLocker) Lock(ctx context.Context, getdb func(context.Context) (*sqlx.DB, error)) {
-       logger := ctxlog.FromContext(ctx)
+//
+// Returns false if ctx is canceled before the lock is acquired.
+func (dbl *DBLocker) Lock(ctx context.Context, getdb func(context.Context) (*sqlx.DB, error)) bool {
+       logger := ctxlog.FromContext(ctx).WithField("ID", dbl.key)
+       var lastHeldBy string
         for ; ; time.Sleep(retryDelay) {
                 dbl.mtx.Lock()
                 if dbl.conn != nil {
@@ -40,55 +49,87 @@ func (dbl *DBLocker) Lock(ctx context.Context, getdb func(context.Context) (*sql
                         dbl.mtx.Unlock()
                         continue
                 }
+               if ctx.Err() != nil {
+                       dbl.mtx.Unlock()
+                       return false
+               }
                 db, err := getdb(ctx)
-               if err != nil {
-                       logger.WithError(err).Infof("error getting database pool")
+               if err == context.Canceled {
+                       dbl.mtx.Unlock()
+                       return false
+               } else if err != nil {
+                       logger.WithError(err).Info("error getting database pool")
                         dbl.mtx.Unlock()
                         continue
                 }
                 conn, err := db.Conn(ctx)
-               if err != nil {
+               if err == context.Canceled {
+                       dbl.mtx.Unlock()
+                       return false
+               } else if err != nil {
                         logger.WithError(err).Info("error getting database connection")
                         dbl.mtx.Unlock()
                         continue
                 }
                 var locked bool
                 err = conn.QueryRowContext(ctx, `SELECT pg_try_advisory_lock($1)`, dbl.key).Scan(&locked)
-               if err != nil {
-                       logger.WithError(err).Infof("error getting pg_try_advisory_lock %d", dbl.key)
+               if err == context.Canceled {
+                       return false
+               } else if err != nil {
+                       logger.WithError(err).Info("error getting pg_try_advisory_lock")
                         conn.Close()
                         dbl.mtx.Unlock()
                         continue
                 }
                 if !locked {
+                       var host string
+                       var port int
+                       err = conn.QueryRowContext(ctx, `SELECT client_addr, client_port FROM pg_stat_activity WHERE pid IN
+                               (SELECT pid FROM pg_locks
+                                WHERE locktype = $1 AND objid = $2)`, "advisory", dbl.key).Scan(&host, &port)
+                       if err != nil {
+                               logger.WithError(err).Info("error getting other client info")
+                       } else {
+                               heldBy := net.JoinHostPort(host, fmt.Sprintf("%d", port))
+                               if lastHeldBy != heldBy {
+                                       logger.WithField("DBClient", heldBy).Info("waiting for other process to release lock")
+                                       lastHeldBy = heldBy
+                               }
+                       }
                         conn.Close()
                         dbl.mtx.Unlock()
                         continue
                 }
-               logger.Debugf("acquired pg_advisory_lock %d", dbl.key)
+               logger.Debug("acquired pg_advisory_lock")
                 dbl.ctx, dbl.getdb, dbl.conn = ctx, getdb, conn
                 dbl.mtx.Unlock()
-               return
+               return true
         }
  }
  
  // Check confirms that the lock is still active (i.e., the session is
  // still alive), and re-acquires if needed. Panics if Lock is not
  // acquired first.
-func (dbl *DBLocker) Check() {
+//
+// Returns false if the context passed to Lock() is canceled before
+// the lock is confirmed or reacquired.
+func (dbl *DBLocker) Check() bool {
         dbl.mtx.Lock()
         err := dbl.conn.PingContext(dbl.ctx)
-       if err == nil {
-               ctxlog.FromContext(dbl.ctx).Debugf("pg_advisory_lock %d connection still alive", dbl.key)
+       if err == context.Canceled {
+               dbl.mtx.Unlock()
+               return false
+       } else if err == nil {
+               ctxlog.FromContext(dbl.ctx).WithField("ID", dbl.key).Debug("connection still alive")
                 dbl.mtx.Unlock()
-               return
+               return true
         }
         ctxlog.FromContext(dbl.ctx).WithError(err).Info("database connection ping failed")
         dbl.conn.Close()
         dbl.conn = nil
         ctx, getdb := dbl.ctx, dbl.getdb
         dbl.mtx.Unlock()
-       dbl.Lock(ctx, getdb)
+       return dbl.Lock(ctx, getdb)
  }
  
  func (dbl *DBLocker) Unlock() {
@@ -97,9 +138,9 @@ func (dbl *DBLocker) Unlock() {
         if dbl.conn != nil {
                 _, err := dbl.conn.ExecContext(context.Background(), `SELECT pg_advisory_unlock($1)`, dbl.key)
                 if err != nil {
-                       ctxlog.FromContext(dbl.ctx).WithError(err).Infof("error releasing pg_advisory_lock %d", dbl.key)
+                       ctxlog.FromContext(dbl.ctx).WithError(err).WithField("ID", dbl.key).Info("error releasing pg_advisory_lock")
                 } else {
-                       ctxlog.FromContext(dbl.ctx).Debugf("released pg_advisory_lock %d", dbl.key)
+                       ctxlog.FromContext(dbl.ctx).WithField("ID", dbl.key).Debug("released pg_advisory_lock")
                 }
                 dbl.conn.Close()
                 dbl.conn = nil
diff --git a/lib/controller/dblock/dblock_test.go b/lib/controller/dblock/dblock_test.go

new file mode 100644 (file)

index 0000000..b10b2a3
--- /dev/null
+++ b/lib/controller/dblock/dblock_test.go
@@ -0,0 +1,91 @@
+// Copyright (C) The Arvados Authors. All rights reserved.
+//
+// SPDX-License-Identifier: AGPL-3.0
+
+package dblock
+
+import (
+       "bytes"
+       "context"
+       "sync"
+       "testing"
+       "time"
+
+       "git.arvados.org/arvados.git/lib/config"
+       "git.arvados.org/arvados.git/sdk/go/arvados"
+       "git.arvados.org/arvados.git/sdk/go/arvadostest"
+       "git.arvados.org/arvados.git/sdk/go/ctxlog"
+       "github.com/jmoiron/sqlx"
+       "github.com/sirupsen/logrus"
+       check "gopkg.in/check.v1"
+)
+
+func Test(t *testing.T) {
+       check.TestingT(t)
+}
+
+var _ = check.Suite(&suite{})
+
+type suite struct {
+       cluster *arvados.Cluster
+       db      *sqlx.DB
+       getdb   func(context.Context) (*sqlx.DB, error)
+}
+
+var testLocker = &DBLocker{key: 999}
+
+func (s *suite) SetUpSuite(c *check.C) {
+       cfg, err := config.NewLoader(nil, ctxlog.TestLogger(c)).Load()
+       c.Assert(err, check.IsNil)
+       s.cluster, err = cfg.GetCluster("")
+       c.Assert(err, check.IsNil)
+       s.db = arvadostest.DB(c, s.cluster)
+       s.getdb = func(context.Context) (*sqlx.DB, error) { return s.db, nil }
+}
+
+func (s *suite) TestLock(c *check.C) {
+       retryDelay = 10 * time.Millisecond
+
+       var logbuf bytes.Buffer
+       logger := ctxlog.New(&logbuf, "text", "debug")
+       logger.Level = logrus.DebugLevel
+       ctx := ctxlog.Context(context.Background(), logger)
+       ctx, cancel := context.WithCancel(ctx)
+       defer cancel()
+       testLocker.Lock(ctx, s.getdb)
+       testLocker.Check()
+
+       lock2 := make(chan bool)
+       var wg sync.WaitGroup
+       defer wg.Wait()
+       wg.Add(1)
+       go func() {
+               defer wg.Done()
+               testLocker2 := &DBLocker{key: 999}
+               testLocker2.Lock(ctx, s.getdb)
+               close(lock2)
+               testLocker2.Check()
+               testLocker2.Unlock()
+       }()
+
+       // Second lock should wait for first to Unlock
+       select {
+       case <-time.After(time.Second / 10):
+               c.Check(logbuf.String(), check.Matches, `(?ms).*level=info.*DBClient="[^"]+:\d+".*ID=999.*`)
+       case <-lock2:
+               c.Log("double-lock")
+               c.Fail()
+       }
+
+       testLocker.Check()
+       testLocker.Unlock()
+
+       // Now the second lock should succeed within retryDelay
+       select {
+       case <-time.After(retryDelay * 2):
+               c.Log("timed out")
+               c.Fail()
+       case <-lock2:
+       }
+       c.Logf("%s", logbuf.String())
+}
diff --git a/lib/controller/federation.go b/lib/controller/federation.go

index e7d6e29b88c1f683f981a1ee5df2b53cf7c862af..93b8315a63be588a0b3e2e1b3182337e68defeff 100644 (file)
--- a/lib/controller/federation.go
+++ b/lib/controller/federation.go
@@ -142,7 +142,7 @@ type CurrentUser struct {
  // non-nil, true, nil -- if the token is valid
  func (h *Handler) validateAPItoken(req *http.Request, token string) (*CurrentUser, bool, error) {
         user := CurrentUser{Authorization: arvados.APIClientAuthorization{APIToken: token}}
-       db, err := h.db(req.Context())
+       db, err := h.dbConnector.GetDB(req.Context())
         if err != nil {
                 ctxlog.FromContext(req.Context()).WithError(err).Debugf("validateAPItoken(%s): database error", token)
                 return nil, false, err
@@ -179,7 +179,7 @@ func (h *Handler) validateAPItoken(req *http.Request, token string) (*CurrentUse
  }
  
  func (h *Handler) createAPItoken(req *http.Request, userUUID string, scopes []string) (*arvados.APIClientAuthorization, error) {
-       db, err := h.db(req.Context())
+       db, err := h.dbConnector.GetDB(req.Context())
         if err != nil {
                 return nil, err
         }
diff --git a/lib/controller/federation/conn.go b/lib/controller/federation/conn.go

index 89f68a5ef1848aab0579ace235a60c92a3c05879..03690af0264001ba37153ac88875837d6031c378 100644 (file)
--- a/lib/controller/federation/conn.go
+++ b/lib/controller/federation/conn.go
@@ -515,6 +515,26 @@ func (conn *Conn) LinkDelete(ctx context.Context, options arvados.DeleteOptions)
         return conn.chooseBackend(options.UUID).LinkDelete(ctx, options)
  }
  
+// LogCreate forwards the request to the backend chosen for
+// options.ClusterID.
+func (conn *Conn) LogCreate(ctx context.Context, options arvados.CreateOptions) (arvados.Log, error) {
+       backend := conn.chooseBackend(options.ClusterID)
+       return backend.LogCreate(ctx, options)
+}
+
+// LogUpdate forwards the request to the backend chosen for
+// options.UUID.
+func (conn *Conn) LogUpdate(ctx context.Context, options arvados.UpdateOptions) (arvados.Log, error) {
+       backend := conn.chooseBackend(options.UUID)
+       return backend.LogUpdate(ctx, options)
+}
+
+// LogGet forwards the request to the backend chosen for
+// options.UUID.
+func (conn *Conn) LogGet(ctx context.Context, options arvados.GetOptions) (arvados.Log, error) {
+       backend := conn.chooseBackend(options.UUID)
+       return backend.LogGet(ctx, options)
+}
+
+// LogList delegates to generated_LogList and returns its result
+// unchanged.
+func (conn *Conn) LogList(ctx context.Context, options arvados.ListOptions) (arvados.LogList, error) {
+       list, err := conn.generated_LogList(ctx, options)
+       return list, err
+}
+
+// LogDelete forwards the request to the backend chosen for
+// options.UUID.
+func (conn *Conn) LogDelete(ctx context.Context, options arvados.DeleteOptions) (arvados.Log, error) {
+       backend := conn.chooseBackend(options.UUID)
+       return backend.LogDelete(ctx, options)
+}
+
  func (conn *Conn) SpecimenList(ctx context.Context, options arvados.ListOptions) (arvados.SpecimenList, error) {
         return conn.generated_SpecimenList(ctx, options)
  }
diff --git a/lib/controller/federation/generate.go b/lib/controller/federation/generate.go

index 8af61315643708aaa96466286275452d3c242edb..86bbf9d9e3fcd991b0020f0a2332a25eb16c9108 100644 (file)
--- a/lib/controller/federation/generate.go
+++ b/lib/controller/federation/generate.go
@@ -53,7 +53,7 @@ func main() {
                 defer out.Close()
                 out.Write(regexp.MustCompile(`(?ms)^.*package .*?import.*?\n\)\n`).Find(buf))
                 io.WriteString(out, "//\n// -- this file is auto-generated -- do not edit -- edit list.go and run \"go generate\" instead --\n//\n\n")
-               for _, t := range []string{"Container", "ContainerRequest", "Group", "Specimen", "User", "Link", "APIClientAuthorization"} {
+               for _, t := range []string{"Container", "ContainerRequest", "Group", "Specimen", "User", "Link", "Log", "APIClientAuthorization"} {
                         _, err := out.Write(bytes.ReplaceAll(orig, []byte("Collection"), []byte(t)))
                         if err != nil {
                                 panic(err)
diff --git a/lib/controller/federation/generated.go b/lib/controller/federation/generated.go

index 66f36161d50817743ba25853fe1aadd637f84bdc..637a1ce9194953aeff865a0cd3f86dad13ba1068 100755 (executable)
--- a/lib/controller/federation/generated.go
+++ b/lib/controller/federation/generated.go
@@ -263,6 +263,47 @@ func (conn *Conn) generated_LinkList(ctx context.Context, options arvados.ListOp
         return merged, err
  }
  
+// generated_LogList runs a Log list query through splitListRequest
+// and merges the per-backend responses into a single LogList.
+//
+// NOTE(review): this file is produced by generate.go ("go generate");
+// a hand-written comment here would be lost on regeneration.
+func (conn *Conn) generated_LogList(ctx context.Context, options arvados.ListOptions) (arvados.LogList, error) {
+       var mtx sync.Mutex
+       var merged arvados.LogList
+       var needSort atomic.Value
+       needSort.Store(false)
+       err := conn.splitListRequest(ctx, options, func(ctx context.Context, _ string, backend arvados.API, options arvados.ListOptions) ([]string, error) {
+               options.ForwardedFor = conn.cluster.ClusterID + "-" + options.ForwardedFor
+               cl, err := backend.LogList(ctx, options)
+               if err != nil {
+                       return nil, err
+               }
+               // mtx guards merged while responses are combined.
+               mtx.Lock()
+               defer mtx.Unlock()
+               if len(merged.Items) == 0 {
+                       // First non-empty response so far: adopt it
+                       // whole.
+                       merged = cl
+               } else if len(cl.Items) > 0 {
+                       // Items from more than one response are being
+                       // combined, so the result must be re-sorted.
+                       merged.Items = append(merged.Items, cl.Items...)
+                       needSort.Store(true)
+               }
+               // Report the UUIDs found in this response to the caller.
+               uuids := make([]string, 0, len(cl.Items))
+               for _, item := range cl.Items {
+                       uuids = append(uuids, item.UUID)
+               }
+               return uuids, nil
+       })
+       if needSort.Load().(bool) {
+               // Apply the default/implied order, "modified_at desc"
+               sort.Slice(merged.Items, func(i, j int) bool {
+                       mi, mj := merged.Items[i].ModifiedAt, merged.Items[j].ModifiedAt
+                       return mj.Before(mi)
+               })
+       }
+       if merged.Items == nil {
+               // Return empty results as [], not null
+               // (https://github.com/golang/go/issues/27589 might be
+               // a better solution in the future)
+               merged.Items = []arvados.Log{}
+       }
+       return merged, err
+}
+
  func (conn *Conn) generated_APIClientAuthorizationList(ctx context.Context, options arvados.ListOptions) (arvados.APIClientAuthorizationList, error) {
         var mtx sync.Mutex
         var merged arvados.APIClientAuthorizationList
diff --git a/lib/controller/federation/list.go b/lib/controller/federation/list.go

index 039caac574e479bdad181dfeed745dd3255640cf..329066d1dcf767ecb03ae13d803858ff715747a0 100644 (file)
--- a/lib/controller/federation/list.go
+++ b/lib/controller/federation/list.go
@@ -65,13 +65,13 @@ func (conn *Conn) generated_CollectionList(ctx context.Context, options arvados.
  // Call fn on one or more local/remote backends if opts indicates a
  // federation-wide list query, i.e.:
  //
-// * There is at least one filter of the form
-//   ["uuid","in",[a,b,c,...]] or ["uuid","=",a]
+//   - There is at least one filter of the form
+//     ["uuid","in",[a,b,c,...]] or ["uuid","=",a]
  //
-// * One or more of the supplied UUIDs (a,b,c,...) has a non-local
-//   prefix.
+//   - One or more of the supplied UUIDs (a,b,c,...) has a non-local
+//     prefix.
  //
-// * There are no other filters
+//   - There are no other filters
  //
  // (If opts doesn't indicate a federation-wide list query, fn is just
  // called once with the local backend.)
@@ -79,29 +79,29 @@ func (conn *Conn) generated_CollectionList(ctx context.Context, options arvados.
  // fn is called more than once only if the query meets the following
  // restrictions:
  //
-// * Count=="none"
+//   - Count=="none"
  //
-// * Limit<0
+//   - Limit<0
  //
-// * len(Order)==0
+//   - len(Order)==0
  //
-// * Each filter is either "uuid = ..." or "uuid in [...]".
+//   - Each filter is either "uuid = ..." or "uuid in [...]".
  //
-// * The maximum possible response size (total number of objects that
-//   could potentially be matched by all of the specified filters)
-//   exceeds the local cluster's response page size limit.
+//   - The maximum possible response size (total number of objects
+//     that could potentially be matched by all of the specified
+//     filters) exceeds the local cluster's response page size limit.
  //
  // If the query involves multiple backends but doesn't meet these
  // restrictions, an error is returned without calling fn.
  //
  // Thus, the caller can assume that either:
  //
-// * splitListRequest() returns an error, or
+//   - splitListRequest() returns an error, or
  //
-// * fn is called exactly once, or
+//   - fn is called exactly once, or
  //
-// * fn is called more than once, with options that satisfy the above
-//   restrictions.
+//   - fn is called more than once, with options that satisfy the above
+//     restrictions.
  //
  // Each call to fn indicates a single (local or remote) backend and a
  // corresponding options argument suitable for sending to that
diff --git a/lib/controller/federation/login_test.go b/lib/controller/federation/login_test.go

index c05ebfce69820b3be781a3d18be8a591aaa94eb2..e1114bf7eb21fd6752598ee7f31fe08199f9ef74 100644 (file)
--- a/lib/controller/federation/login_test.go
+++ b/lib/controller/federation/login_test.go
@@ -41,25 +41,27 @@ func (s *LoginSuite) TestDeferToLoginCluster(c *check.C) {
  }
  
  func (s *LoginSuite) TestLogout(c *check.C) {
+       otherOrigin := arvados.URL{Scheme: "https", Host: "app.example.com", Path: "/"}
+       otherURL := "https://app.example.com/foo"
         s.cluster.Services.Workbench1.ExternalURL = arvados.URL{Scheme: "https", Host: "workbench1.example.com"}
         s.cluster.Services.Workbench2.ExternalURL = arvados.URL{Scheme: "https", Host: "workbench2.example.com"}
+       s.cluster.Login.TrustedClients = map[arvados.URL]struct{}{otherOrigin: {}}
         s.addHTTPRemote(c, "zhome", &arvadostest.APIStub{})
         s.cluster.Login.LoginCluster = "zhome"
         // s.fed is already set by SetUpTest, but we need to
         // reinitialize with the above config changes.
         s.fed = New(s.cluster, nil)
  
-       returnTo := "https://app.example.com/foo?bar"
         for _, trial := range []struct {
                 token    string
                 returnTo string
                 target   string
         }{
                 {token: "", returnTo: "", target: s.cluster.Services.Workbench2.ExternalURL.String()},
-               {token: "", returnTo: returnTo, target: returnTo},
-               {token: "zzzzzzzzzzzzzzzzzzzzz", returnTo: returnTo, target: returnTo},
-               {token: "v2/zzzzz-aaaaa-aaaaaaaaaaaaaaa/aaaaaaaaaaaaaaaaaaaaaaaaaaaaaa", returnTo: returnTo, target: returnTo},
-               {token: "v2/zhome-aaaaa-aaaaaaaaaaaaaaa/aaaaaaaaaaaaaaaaaaaaaaaaaaaaaa", returnTo: returnTo, target: "http://" + s.cluster.RemoteClusters["zhome"].Host + "/logout?" + url.Values{"return_to": {returnTo}}.Encode()},
+               {token: "", returnTo: otherURL, target: otherURL},
+               {token: "zzzzzzzzzzzzzzzzzzzzz", returnTo: otherURL, target: otherURL},
+               {token: "v2/zzzzz-aaaaa-aaaaaaaaaaaaaaa/aaaaaaaaaaaaaaaaaaaaaaaaaaaaaa", returnTo: otherURL, target: otherURL},
+               {token: "v2/zhome-aaaaa-aaaaaaaaaaaaaaa/aaaaaaaaaaaaaaaaaaaaaaaaaaaaaa", returnTo: otherURL, target: "http://" + s.cluster.RemoteClusters["zhome"].Host + "/logout?" + url.Values{"return_to": {otherURL}}.Encode()},
         } {
                 c.Logf("trial %#v", trial)
                 ctx := s.ctx
diff --git a/lib/controller/handler.go b/lib/controller/handler.go

index 665fd5c636372fc4a21bd7de68c5d886aafbcc7c..4c6fca7f77276c3981c591d18429d8520d3e76b7 100644 (file)
--- a/lib/controller/handler.go
+++ b/lib/controller/handler.go
@@ -6,7 +6,6 @@ package controller
  
  import (
         "context"
-       "errors"
         "fmt"
         "net/http"
         "net/http/httptest"
@@ -21,10 +20,8 @@ import (
         "git.arvados.org/arvados.git/lib/controller/router"
         "git.arvados.org/arvados.git/lib/ctrlctx"
         "git.arvados.org/arvados.git/sdk/go/arvados"
-       "git.arvados.org/arvados.git/sdk/go/ctxlog"
         "git.arvados.org/arvados.git/sdk/go/health"
         "git.arvados.org/arvados.git/sdk/go/httpserver"
-       "github.com/jmoiron/sqlx"
  
         // sqlx needs lib/pq to talk to PostgreSQL
         _ "github.com/lib/pq"
@@ -40,8 +37,7 @@ type Handler struct {
         proxy          *proxy
         secureClient   *http.Client
         insecureClient *http.Client
-       pgdb           *sqlx.DB
-       pgdbMtx        sync.Mutex
+       dbConnector    ctrlctx.DBConnector
  }
  
  func (h *Handler) ServeHTTP(w http.ResponseWriter, req *http.Request) {
@@ -65,7 +61,7 @@ func (h *Handler) ServeHTTP(w http.ResponseWriter, req *http.Request) {
  
  func (h *Handler) CheckHealth() error {
         h.setupOnce.Do(h.setup)
-       _, err := h.db(context.TODO())
+       _, err := h.dbConnector.GetDB(context.TODO())
         if err != nil {
                 return err
         }
@@ -97,14 +93,18 @@ func (h *Handler) setup() {
         mux := http.NewServeMux()
         healthFuncs := make(map[string]health.Func)
  
-       oidcAuthorizer := localdb.OIDCAccessTokenAuthorizer(h.Cluster, h.db)
+       h.dbConnector = ctrlctx.DBConnector{PostgreSQL: h.Cluster.PostgreSQL}
+       oidcAuthorizer := localdb.OIDCAccessTokenAuthorizer(h.Cluster, h.dbConnector.GetDB)
         h.federation = federation.New(h.Cluster, &healthFuncs)
         rtr := router.New(h.federation, router.Config{
                 MaxRequestSize: h.Cluster.API.MaxRequestSize,
-               WrapCalls:      api.ComposeWrappers(ctrlctx.WrapCallsInTransactions(h.db), oidcAuthorizer.WrapCalls),
+               WrapCalls: api.ComposeWrappers(
+                       ctrlctx.WrapCallsInTransactions(h.dbConnector.GetDB),
+                       oidcAuthorizer.WrapCalls,
+                       ctrlctx.WrapCallsWithAuth(h.Cluster)),
         })
  
-       healthRoutes := health.Routes{"ping": func() error { _, err := h.db(context.TODO()); return err }}
+       healthRoutes := health.Routes{"ping": func() error { _, err := h.dbConnector.GetDB(context.TODO()); return err }}
         for name, f := range healthFuncs {
                 healthRoutes[name] = f
         }
@@ -152,31 +152,7 @@ func (h *Handler) setup() {
         }
  
         go h.trashSweepWorker()
-}
-
-var errDBConnection = errors.New("database connection error")
-
-func (h *Handler) db(ctx context.Context) (*sqlx.DB, error) {
-       h.pgdbMtx.Lock()
-       defer h.pgdbMtx.Unlock()
-       if h.pgdb != nil {
-               return h.pgdb, nil
-       }
-
-       db, err := sqlx.Open("postgres", h.Cluster.PostgreSQL.Connection.String())
-       if err != nil {
-               ctxlog.FromContext(ctx).WithError(err).Error("postgresql connect failed")
-               return nil, errDBConnection
-       }
-       if p := h.Cluster.PostgreSQL.ConnectionPool; p > 0 {
-               db.SetMaxOpenConns(p)
-       }
-       if err := db.Ping(); err != nil {
-               ctxlog.FromContext(ctx).WithError(err).Error("postgresql connect succeeded but ping failed")
-               return nil, errDBConnection
-       }
-       h.pgdb = db
-       return db, nil
+       go h.containerLogSweepWorker()
  }
  
  type middlewareFunc func(http.ResponseWriter, *http.Request, http.Handler)
diff --git a/lib/controller/handler_test.go b/lib/controller/handler_test.go

index 39c2b1c68e5c82921e10bc9125d54e17846a8fed..1af3ba3626c94dc517fd657270a24ed067eaace5 100644 (file)
--- a/lib/controller/handler_test.go
+++ b/lib/controller/handler_test.go
@@ -19,6 +19,7 @@ import (
         "testing"
         "time"
  
+       "git.arvados.org/arvados.git/lib/controller/rpc"
         "git.arvados.org/arvados.git/sdk/go/arvados"
         "git.arvados.org/arvados.git/sdk/go/arvadostest"
         "git.arvados.org/arvados.git/sdk/go/auth"
@@ -271,18 +272,20 @@ func (s *HandlerSuite) TestProxyNotFound(c *check.C) {
  }
  
  func (s *HandlerSuite) TestLogoutGoogle(c *check.C) {
+       s.cluster.Services.Workbench2.ExternalURL = arvados.URL{Scheme: "https", Host: "wb2.example", Path: "/"}
         s.cluster.Login.Google.Enable = true
         s.cluster.Login.Google.ClientID = "test"
-       req := httptest.NewRequest("GET", "https://0.0.0.0:1/logout?return_to=https://example.com/foo", nil)
+       req := httptest.NewRequest("GET", "https://0.0.0.0:1/logout?return_to=https://wb2.example/", nil)
         resp := httptest.NewRecorder()
         s.handler.ServeHTTP(resp, req)
         if !c.Check(resp.Code, check.Equals, http.StatusFound) {
                 c.Log(resp.Body.String())
         }
-       c.Check(resp.Header().Get("Location"), check.Equals, "https://example.com/foo")
+       c.Check(resp.Header().Get("Location"), check.Equals, "https://wb2.example/")
  }
  
  func (s *HandlerSuite) TestValidateV1APIToken(c *check.C) {
+       c.Assert(s.handler.CheckHealth(), check.IsNil)
         req := httptest.NewRequest("GET", "/arvados/v1/users/current", nil)
         user, ok, err := s.handler.validateAPItoken(req, arvadostest.ActiveToken)
         c.Assert(err, check.IsNil)
@@ -294,6 +297,7 @@ func (s *HandlerSuite) TestValidateV1APIToken(c *check.C) {
  }
  
  func (s *HandlerSuite) TestValidateV2APIToken(c *check.C) {
+       c.Assert(s.handler.CheckHealth(), check.IsNil)
         req := httptest.NewRequest("GET", "/arvados/v1/users/current", nil)
         user, ok, err := s.handler.validateAPItoken(req, arvadostest.ActiveTokenV2)
         c.Assert(err, check.IsNil)
@@ -336,6 +340,7 @@ func (s *HandlerSuite) TestLogTokenUUID(c *check.C) {
  }
  
  func (s *HandlerSuite) TestCreateAPIToken(c *check.C) {
+       c.Assert(s.handler.CheckHealth(), check.IsNil)
         req := httptest.NewRequest("GET", "/arvados/v1/users/current", nil)
         auth, err := s.handler.createAPItoken(req, arvadostest.ActiveUserUUID, nil)
         c.Assert(err, check.IsNil)
@@ -476,7 +481,7 @@ func (s *HandlerSuite) TestTrashSweep(c *check.C) {
         coll, err := s.handler.federation.CollectionCreate(ctx, arvados.CreateOptions{Attrs: map[string]interface{}{"name": "test trash sweep"}, EnsureUniqueName: true})
         c.Assert(err, check.IsNil)
         defer s.handler.federation.CollectionDelete(ctx, arvados.DeleteOptions{UUID: coll.UUID})
-       db, err := s.handler.db(s.ctx)
+       db, err := s.handler.dbConnector.GetDB(s.ctx)
         c.Assert(err, check.IsNil)
         _, err = db.ExecContext(s.ctx, `update collections set trash_at = $1, delete_at = $2 where uuid = $3`, time.Now().UTC().Add(time.Second/10), time.Now().UTC().Add(time.Hour), coll.UUID)
         c.Assert(err, check.IsNil)
@@ -494,3 +499,67 @@ func (s *HandlerSuite) TestTrashSweep(c *check.C) {
                 time.Sleep(time.Second / 10)
         }
  }
+
+// TestContainerLogSweep creates a "stderr" log entry for
+// arvadostest.CompletedContainerUUID with a 100ms SweepInterval
+// configured, then polls LogList until the entry no longer appears,
+// failing if it is still listed after 5 seconds.
+func (s *HandlerSuite) TestContainerLogSweep(c *check.C) {
+       s.cluster.SystemRootToken = arvadostest.SystemRootToken
+       s.cluster.Containers.Logging.SweepInterval = arvados.Duration(time.Second / 10)
+       s.handler.CheckHealth()
+       ctx := auth.NewContext(s.ctx, &auth.Credentials{Tokens: []string{arvadostest.ActiveTokenV2}})
+       attrs := map[string]interface{}{
+               "object_uuid": arvadostest.CompletedContainerUUID,
+               "event_type":  "stderr",
+               "properties": map[string]interface{}{
+                       "text": "test trash sweep\n",
+               },
+       }
+       created, err := s.handler.federation.LogCreate(ctx, arvados.CreateOptions{Attrs: attrs})
+       c.Assert(err, check.IsNil)
+       // Clean up the entry at the end of the test regardless of
+       // whether it was swept.
+       defer s.handler.federation.LogDelete(ctx, arvados.DeleteOptions{UUID: created.UUID})
+       // Poll every 100ms until the entry is gone or the deadline
+       // passes.
+       for deadline := time.Now().Add(5 * time.Second); ; time.Sleep(time.Second / 10) {
+               if time.Now().After(deadline) {
+                       c.Log("timed out")
+                       c.FailNow()
+               }
+               query := arvados.ListOptions{Filters: []arvados.Filter{{"uuid", "=", created.UUID}}, Limit: -1}
+               found, err := s.handler.federation.LogList(ctx, query)
+               c.Assert(err, check.IsNil)
+               if len(found.Items) == 0 {
+                       break
+               }
+       }
+}
+
+// TestLogActivity sends several CollectionList requests per token
+// through a test server with a 24-hour ActivityLoggingPeriod, then
+// checks that the logs table holds exactly one new row for each of
+// the active and spectator users.
+func (s *HandlerSuite) TestLogActivity(c *check.C) {
+       s.cluster.SystemRootToken = arvadostest.SystemRootToken
+       s.cluster.Users.ActivityLoggingPeriod = arvados.Duration(24 * time.Hour)
+       s.handler.CheckHealth()
+
+       testServer := newServerFromIntegrationTestEnv(c)
+       testServer.Server.Handler = httpserver.AddRequestIDs(httpserver.LogRequests(s.handler))
+       c.Assert(testServer.Start(), check.IsNil)
+       defer testServer.Close()
+
+       // Fail here rather than hand a nil URL to rpc.NewConn if the
+       // server address is unparsable.
+       u, err := url.Parse("http://" + testServer.Addr)
+       c.Assert(err, check.IsNil)
+       client := rpc.NewConn(s.cluster.ClusterID, u, true, rpc.PassthroughTokenProvider)
+
+       // Only rows with event_at after this instant are counted below.
+       starttime := time.Now()
+       // NOTE(review): presumably both Active tokens belong to
+       // arvadostest.ActiveUserUUID -- confirm against the fixtures.
+       for i := 0; i < 4; i++ {
+               for _, token := range []string{
+                       arvadostest.ActiveTokenV2,
+                       arvadostest.ActiveToken,
+                       arvadostest.SpectatorToken,
+               } {
+                       ctx := auth.NewContext(s.ctx, &auth.Credentials{Tokens: []string{token}})
+                       _, err := client.CollectionList(ctx, arvados.ListOptions{})
+                       c.Assert(err, check.IsNil)
+               }
+       }
+       db, err := s.handler.dbConnector.GetDB(s.ctx)
+       c.Assert(err, check.IsNil)
+       for _, userUUID := range []string{arvadostest.ActiveUserUUID, arvadostest.SpectatorUserUUID} {
+               var rows int
+               // Query the user under test; binding a fixed UUID here
+               // would leave the spectator user unchecked.
+               err = db.QueryRowContext(s.ctx, `select count(uuid) from logs where object_uuid = $1 and event_at > $2`, userUUID, starttime.UTC()).Scan(&rows)
+               c.Assert(err, check.IsNil)
+               c.Check(rows, check.Equals, 1, check.Commentf("expect 1 row for user uuid %s", userUUID))
+       }
+}
diff --git a/lib/controller/localdb/collection.go b/lib/controller/localdb/collection.go

index 868e466e9e281bf7f4f5eaf8b4f7a530956653cf..581595e5e3818a56b4194adc47834e87035a3ce8 100644 (file)
--- a/lib/controller/localdb/collection.go
+++ b/lib/controller/localdb/collection.go
@@ -22,6 +22,7 @@ import (
  // CollectionGet defers to railsProxy for everything except blob
  // signatures.
  func (conn *Conn) CollectionGet(ctx context.Context, opts arvados.GetOptions) (arvados.Collection, error) {
+       conn.logActivity(ctx)
         if len(opts.Select) > 0 {
                 // We need to know IsTrashed and TrashAt to implement
                 // signing properly, even if the caller doesn't want
@@ -39,6 +40,7 @@ func (conn *Conn) CollectionGet(ctx context.Context, opts arvados.GetOptions) (a
  // CollectionList defers to railsProxy for everything except blob
  // signatures.
  func (conn *Conn) CollectionList(ctx context.Context, opts arvados.ListOptions) (arvados.CollectionList, error) {
+       conn.logActivity(ctx)
         if len(opts.Select) > 0 {
                 // We need to know IsTrashed and TrashAt to implement
                 // signing properly, even if the caller doesn't want
@@ -58,6 +60,7 @@ func (conn *Conn) CollectionList(ctx context.Context, opts arvados.ListOptions)
  // CollectionCreate defers to railsProxy for everything except blob
  // signatures and vocabulary checking.
  func (conn *Conn) CollectionCreate(ctx context.Context, opts arvados.CreateOptions) (arvados.Collection, error) {
+       conn.logActivity(ctx)
         err := conn.checkProperties(ctx, opts.Attrs["properties"])
         if err != nil {
                 return arvados.Collection{}, err
@@ -82,6 +85,7 @@ func (conn *Conn) CollectionCreate(ctx context.Context, opts arvados.CreateOptio
  // CollectionUpdate defers to railsProxy for everything except blob
  // signatures and vocabulary checking.
  func (conn *Conn) CollectionUpdate(ctx context.Context, opts arvados.UpdateOptions) (arvados.Collection, error) {
+       conn.logActivity(ctx)
         err := conn.checkProperties(ctx, opts.Attrs["properties"])
         if err != nil {
                 return arvados.Collection{}, err
diff --git a/lib/controller/localdb/conn.go b/lib/controller/localdb/conn.go

index a36822ad6b1f5df1f73ffbc3536d76a7215f1817..5b6964de00d105ec89938e3c2f4e556688fd4722 100644 (file)
--- a/lib/controller/localdb/conn.go
+++ b/lib/controller/localdb/conn.go
@@ -8,9 +8,9 @@ import (
         "context"
         "encoding/json"
         "fmt"
+       "net"
         "net/http"
         "os"
-       "strings"
         "sync"
         "time"
  
@@ -33,8 +33,11 @@ type Conn struct {
         lastVocabularyRefreshCheck time.Time
         lastVocabularyError        error
         loginController
-       gwTunnels     map[string]*yamux.Session
-       gwTunnelsLock sync.Mutex
+       gwTunnels        map[string]*yamux.Session
+       gwTunnelsLock    sync.Mutex
+       activeUsers      map[string]bool
+       activeUsersLock  sync.Mutex
+       activeUsersReset time.Time
  }
  
  func NewConn(cluster *arvados.Cluster) *Conn {
@@ -163,53 +166,25 @@ func (conn *Conn) UserAuthenticate(ctx context.Context, opts arvados.UserAuthent
         return conn.loginController.UserAuthenticate(ctx, opts)
  }
  
-func (conn *Conn) GroupContents(ctx context.Context, options arvados.GroupContentsOptions) (arvados.ObjectList, error) {
-       // The requested UUID can be a user (virtual home project), which we just pass on to
-       // the API server.
-       if strings.Index(options.UUID, "-j7d0g-") != 5 {
-               return conn.railsProxy.GroupContents(ctx, options)
-       }
-
-       var resp arvados.ObjectList
-
-       // Get the group object
-       respGroup, err := conn.GroupGet(ctx, arvados.GetOptions{UUID: options.UUID})
-       if err != nil {
-               return resp, err
-       }
-
-       // If the group has groupClass 'filter', apply the filters before getting the contents.
-       if respGroup.GroupClass == "filter" {
-               if filters, ok := respGroup.Properties["filters"].([]interface{}); ok {
-                       for _, f := range filters {
-                               // f is supposed to be a []string
-                               tmp, ok2 := f.([]interface{})
-                               if !ok2 || len(tmp) < 3 {
-                                       return resp, fmt.Errorf("filter unparsable: %T, %+v, original field: %T, %+v\n", tmp, tmp, f, f)
-                               }
-                               var filter arvados.Filter
-                               if attr, ok2 := tmp[0].(string); ok2 {
-                                       filter.Attr = attr
-                               } else {
-                                       return resp, fmt.Errorf("filter unparsable: attribute must be string: %T, %+v, filter: %T, %+v\n", tmp[0], tmp[0], f, f)
-                               }
-                               if operator, ok2 := tmp[1].(string); ok2 {
-                                       filter.Operator = operator
-                               } else {
-                                       return resp, fmt.Errorf("filter unparsable: operator must be string: %T, %+v, filter: %T, %+v\n", tmp[1], tmp[1], f, f)
-                               }
-                               filter.Operand = tmp[2]
-                               options.Filters = append(options.Filters, filter)
-                       }
-               } else {
-                       return resp, fmt.Errorf("filter unparsable: not an array\n")
+var privateNetworks = func() (nets []*net.IPNet) {
+       for _, s := range []string{
+               "127.0.0.0/8",
+               "10.0.0.0/8",
+               "172.16.0.0/12",
+               "192.168.0.0/16",
+               "169.254.0.0/16",
+               "::1/128",
+               "fe80::/10",
+               "fc00::/7",
+       } {
+               _, n, err := net.ParseCIDR(s)
+               if err != nil {
+                       panic(fmt.Sprintf("privateNetworks: %q: %s", s, err))
                 }
-               // Use the generic /groups/contents endpoint for filter groups
-               options.UUID = ""
+               nets = append(nets, n)
         }
-
-       return conn.railsProxy.GroupContents(ctx, options)
-}
+       return
+}()
  
  func httpErrorf(code int, format string, args ...interface{}) error {
         return httpserver.ErrorWithStatus(fmt.Errorf(format, args...), code)
diff --git a/lib/controller/localdb/container_request.go b/lib/controller/localdb/container_request.go

index 5b2ce95da99c2c8195ce2ceac6aaa925a75d2e0f..49e21840ea206f69684738e2f9aec98f0f6c2fd3 100644 (file)
--- a/lib/controller/localdb/container_request.go
+++ b/lib/controller/localdb/container_request.go
@@ -13,6 +13,7 @@ import (
  // ContainerRequestCreate defers to railsProxy for everything except
  // vocabulary checking.
  func (conn *Conn) ContainerRequestCreate(ctx context.Context, opts arvados.CreateOptions) (arvados.ContainerRequest, error) {
+       conn.logActivity(ctx)
         err := conn.checkProperties(ctx, opts.Attrs["properties"])
         if err != nil {
                 return arvados.ContainerRequest{}, err
@@ -27,6 +28,7 @@ func (conn *Conn) ContainerRequestCreate(ctx context.Context, opts arvados.Creat
  // ContainerRequestUpdate defers to railsProxy for everything except
  // vocabulary checking.
  func (conn *Conn) ContainerRequestUpdate(ctx context.Context, opts arvados.UpdateOptions) (arvados.ContainerRequest, error) {
+       conn.logActivity(ctx)
         err := conn.checkProperties(ctx, opts.Attrs["properties"])
         if err != nil {
                 return arvados.ContainerRequest{}, err
@@ -37,3 +39,18 @@ func (conn *Conn) ContainerRequestUpdate(ctx context.Context, opts arvados.Updat
         }
         return resp, nil
  }
+
+// ContainerRequestGet calls conn.logActivity and then defers to
+// railsProxy.
+func (conn *Conn) ContainerRequestGet(ctx context.Context, opts arvados.GetOptions) (arvados.ContainerRequest, error) {
+       conn.logActivity(ctx)
+       resp, err := conn.railsProxy.ContainerRequestGet(ctx, opts)
+       return resp, err
+}
+
+// ContainerRequestList calls conn.logActivity and then defers to
+// railsProxy.
+func (conn *Conn) ContainerRequestList(ctx context.Context, opts arvados.ListOptions) (arvados.ContainerRequestList, error) {
+       conn.logActivity(ctx)
+       resp, err := conn.railsProxy.ContainerRequestList(ctx, opts)
+       return resp, err
+}
+
+// ContainerRequestDelete calls conn.logActivity and then defers to
+// railsProxy.
+func (conn *Conn) ContainerRequestDelete(ctx context.Context, opts arvados.DeleteOptions) (arvados.ContainerRequest, error) {
+       conn.logActivity(ctx)
+       resp, err := conn.railsProxy.ContainerRequestDelete(ctx, opts)
+       return resp, err
+}
diff --git a/lib/controller/localdb/group.go b/lib/controller/localdb/group.go

index 0d77bdbd9ce792a28ba436ae05ba95bc7d1ce0f0..418fd6b8b7ec5bcc955c62c0d1207b66284d587b 100644 (file)
--- a/lib/controller/localdb/group.go
+++ b/lib/controller/localdb/group.go
@@ -6,6 +6,8 @@ package localdb
  
  import (
         "context"
+       "fmt"
+       "strings"
  
         "git.arvados.org/arvados.git/sdk/go/arvados"
  )
@@ -13,6 +15,7 @@ import (
  // GroupCreate defers to railsProxy for everything except vocabulary
  // checking.
  func (conn *Conn) GroupCreate(ctx context.Context, opts arvados.CreateOptions) (arvados.Group, error) {
+       conn.logActivity(ctx)
         err := conn.checkProperties(ctx, opts.Attrs["properties"])
         if err != nil {
                 return arvados.Group{}, err
@@ -24,9 +27,15 @@ func (conn *Conn) GroupCreate(ctx context.Context, opts arvados.CreateOptions) (
         return resp, nil
  }
  
+// GroupGet calls conn.logActivity and then defers to railsProxy.
+func (conn *Conn) GroupGet(ctx context.Context, opts arvados.GetOptions) (arvados.Group, error) {
+       conn.logActivity(ctx)
+       resp, err := conn.railsProxy.GroupGet(ctx, opts)
+       return resp, err
+}
+
  // GroupUpdate defers to railsProxy for everything except vocabulary
  // checking.
  func (conn *Conn) GroupUpdate(ctx context.Context, opts arvados.UpdateOptions) (arvados.Group, error) {
+       conn.logActivity(ctx)
         err := conn.checkProperties(ctx, opts.Attrs["properties"])
         if err != nil {
                 return arvados.Group{}, err
@@ -37,3 +46,63 @@ func (conn *Conn) GroupUpdate(ctx context.Context, opts arvados.UpdateOptions) (
         }
         return resp, nil
  }
+
+// GroupList calls logActivity for the request and then defers to
+// railsProxy.
+func (conn *Conn) GroupList(ctx context.Context, opts arvados.ListOptions) (arvados.GroupList, error) {
+       conn.logActivity(ctx)
+       return conn.railsProxy.GroupList(ctx, opts)
+}
+
+// GroupDelete calls logActivity for the request and then defers to
+// railsProxy.
+func (conn *Conn) GroupDelete(ctx context.Context, opts arvados.DeleteOptions) (arvados.Group, error) {
+       conn.logActivity(ctx)
+       return conn.railsProxy.GroupDelete(ctx, opts)
+}
+
+// GroupContents returns the contents of the group (or user home
+// project) identified by options.UUID.
+//
+// If the UUID does not have the group infix "-j7d0g-" at offset 5,
+// or the group's GroupClass is not "filter", the request is passed
+// to railsProxy unchanged. For a filter group, each entry of the
+// group's "filters" property is appended to options.Filters and
+// options.UUID is cleared, so railsProxy is asked for a generic
+// contents listing restricted by those filters.
+//
+// An error is returned if the group cannot be fetched, or if the
+// "filters" property is not an array whose entries are arrays of at
+// least three elements with a string attribute and string operator.
+func (conn *Conn) GroupContents(ctx context.Context, options arvados.GroupContentsOptions) (arvados.ObjectList, error) {
+       conn.logActivity(ctx)
+
+       // The requested UUID can be a user (virtual home project), which we just pass on to
+       // the API server.
+       if strings.Index(options.UUID, "-j7d0g-") != 5 {
+               return conn.railsProxy.GroupContents(ctx, options)
+       }
+
+       var resp arvados.ObjectList
+
+       // Get the group object
+       respGroup, err := conn.GroupGet(ctx, arvados.GetOptions{UUID: options.UUID})
+       if err != nil {
+               return resp, err
+       }
+
+       // If the group has groupClass 'filter', apply the filters before getting the contents.
+       if respGroup.GroupClass == "filter" {
+               if filters, ok := respGroup.Properties["filters"].([]interface{}); ok {
+                       for _, f := range filters {
+                               // f is supposed to be a 3-element array:
+                               // [attribute, operator, operand]
+                               tmp, ok2 := f.([]interface{})
+                               if !ok2 || len(tmp) < 3 {
+                                       return resp, fmt.Errorf("filter unparsable: %T, %+v, original field: %T, %+v", tmp, tmp, f, f)
+                               }
+                               var filter arvados.Filter
+                               if attr, ok2 := tmp[0].(string); ok2 {
+                                       filter.Attr = attr
+                               } else {
+                                       return resp, fmt.Errorf("filter unparsable: attribute must be string: %T, %+v, filter: %T, %+v", tmp[0], tmp[0], f, f)
+                               }
+                               if operator, ok2 := tmp[1].(string); ok2 {
+                                       filter.Operator = operator
+                               } else {
+                                       return resp, fmt.Errorf("filter unparsable: operator must be string: %T, %+v, filter: %T, %+v", tmp[1], tmp[1], f, f)
+                               }
+                               // The operand is passed through as-is, whatever its type.
+                               filter.Operand = tmp[2]
+                               options.Filters = append(options.Filters, filter)
+                       }
+               } else {
+                       return resp, fmt.Errorf("filter unparsable: not an array")
+               }
+               // Use the generic /groups/contents endpoint for filter groups
+               options.UUID = ""
+       }
+
+       return conn.railsProxy.GroupContents(ctx, options)
+}
diff --git a/lib/controller/localdb/log_activity.go b/lib/controller/localdb/log_activity.go

new file mode 100644 (file)

index 0000000..9c9660a
--- /dev/null
+++ b/lib/controller/localdb/log_activity.go
@@ -0,0 +1,117 @@
+// Copyright (C) The Arvados Authors. All rights reserved.
+//
+// SPDX-License-Identifier: AGPL-3.0
+
+package localdb
+
+import (
+       "context"
+       "time"
+
+       "git.arvados.org/arvados.git/lib/ctrlctx"
+       "git.arvados.org/arvados.git/sdk/go/arvados"
+       "git.arvados.org/arvados.git/sdk/go/ctxlog"
+)
+
+// logActivity records that the authenticated user made an API call
+// by inserting an "activity" row in the logs table, at most once per
+// user per Users.ActivityLoggingPeriod.
+//
+// It does nothing if the configured period is less than 1 (logging
+// disabled) or if the request is unauthenticated. The set of users
+// already handled in the current period is kept in memory in
+// conn.activeUsers, guarded by conn.activeUsersLock. Failures are
+// reported through the context logger only; nothing is returned to
+// the caller.
+func (conn *Conn) logActivity(ctx context.Context) {
+       p := conn.cluster.Users.ActivityLoggingPeriod.Duration()
+       if p < 1 {
+               ctxlog.FromContext(ctx).Debug("logActivity disabled by config")
+               return
+       }
+       user, _, err := ctrlctx.CurrentAuth(ctx)
+       if err == ctrlctx.ErrUnauthenticated {
+               ctxlog.FromContext(ctx).Debug("logActivity skipped for unauthenticated request")
+               return
+       } else if err != nil {
+               ctxlog.FromContext(ctx).WithError(err).Error("logActivity CurrentAuth failed")
+               return
+       }
+       now := time.Now()
+       conn.activeUsersLock.Lock()
+       // Start a new period (and forget which users were seen in
+       // the previous one) on first use or once the current
+       // period's end time has passed.
+       if conn.activeUsers == nil || conn.activeUsersReset.IsZero() || conn.activeUsersReset.Before(now) {
+               conn.activeUsersReset = alignedPeriod(now, p)
+               conn.activeUsers = map[string]bool{}
+       }
+       logged := conn.activeUsers[user.UUID]
+       if !logged {
+               // Prevent other concurrent calls from logging about
+               // this user until we finish.
+               conn.activeUsers[user.UUID] = true
+       }
+       conn.activeUsersLock.Unlock()
+       if logged {
+               return
+       }
+       // From here on, logged stays false until the insert has been
+       // committed (see the last statement of this function).
+       defer func() {
+               // If we return without logging, reset the flag so we
+               // try again on the user's next API call.
+               if !logged {
+                       conn.activeUsersLock.Lock()
+                       conn.activeUsers[user.UUID] = false
+                       conn.activeUsersLock.Unlock()
+               }
+       }()
+
+       tx, err := ctrlctx.NewTx(ctx)
+       if err != nil {
+               ctxlog.FromContext(ctx).WithError(err).Error("logActivity NewTx failed")
+               return
+       }
+       // NOTE(review): presumably has no effect once Commit below
+       // has succeeded -- confirm against the type returned by NewTx.
+       defer tx.Rollback()
+       _, err = tx.ExecContext(ctx, `
+insert into logs
+ (uuid,
+  owner_uuid, modified_by_user_uuid, object_owner_uuid,
+  event_type,
+  summary,
+  object_uuid,
+  properties,
+  event_at, created_at, updated_at, modified_at)
+ values
+ ($1, $2, $2, $2, $3, $4, $5, $6,
+  current_timestamp at time zone 'UTC',
+  current_timestamp at time zone 'UTC',
+  current_timestamp at time zone 'UTC',
+  current_timestamp at time zone 'UTC')
+ returning id`,
+               arvados.RandomUUID(conn.cluster.ClusterID, "57u5n"),
+               conn.cluster.ClusterID+"-tpzed-000000000000000", // $2: owner, modified_by, and object_owner
+               "activity",
+               "activity of "+user.UUID,
+               user.UUID,
+               "{}")
+       if err != nil {
+               ctxlog.FromContext(ctx).WithError(err).Error("logActivity query failed")
+               return
+       }
+       err = tx.Commit()
+       if err != nil {
+               ctxlog.FromContext(ctx).WithError(err).Error("logActivity commit failed")
+               return
+       }
+       logged = true
+}
+
+// alignedPeriod computes a time interval that includes now and aligns
+// to local clock times that are multiples of p. For example, if local
+// time is UTC-5 and ActivityLoggingPeriod=4h, periodStart and
+// periodEnd will be 0000-0400, 0400-0800, etc., in local time. If p
+// is a multiple of 24h, periods will start and end at midnight.
+//
+// If DST starts or ends during this period, the boundaries will be
+// aligned based on either DST or non-DST time depending on whether
+// now is before or after the DST transition. This is presumed to be
+// harmless: at worst, logActivity may log activity more than once
+// (i.e., unnecessarily) in a period that includes a DST
+// transition.
+//
+// In all cases, the period ends in the future.
+//
+// Only the end of the period is returned.
+func alignedPeriod(now time.Time, p time.Duration) time.Time {
+       _, tzsec := now.Zone()
+       tzoff := time.Duration(tzsec) * time.Second
+       // Shift by the zone offset, truncate to a multiple of p, then
+       // shift back, so the boundary lines up with local clock time.
+       periodStart := now.Add(tzoff).Truncate(p).Add(-tzoff)
+       return periodStart.Add(p)
+}
diff --git a/lib/controller/localdb/log_activity_test.go b/lib/controller/localdb/log_activity_test.go

new file mode 100644 (file)

index 0000000..ea7f234
--- /dev/null
+++ b/lib/controller/localdb/log_activity_test.go
@@ -0,0 +1,87 @@
+// Copyright (C) The Arvados Authors. All rights reserved.
+//
+// SPDX-License-Identifier: AGPL-3.0
+
+package localdb
+
+import (
+       "context"
+       "database/sql"
+       "time"
+
+       "git.arvados.org/arvados.git/lib/controller/api"
+       "git.arvados.org/arvados.git/lib/ctrlctx"
+       "git.arvados.org/arvados.git/sdk/go/arvados"
+       "git.arvados.org/arvados.git/sdk/go/arvadostest"
+       "git.arvados.org/arvados.git/sdk/go/auth"
+       "github.com/jmoiron/sqlx"
+       check "gopkg.in/check.v1"
+)
+
+var _ = check.Suite(&activityPeriodSuite{})
+
+type activityPeriodSuite struct{}
+
+// The important thing is that, even when daylight savings time is
+// making things difficult, the current period ends in the future.
+//
+// TestPeriod checks this for several period lengths, sampling every
+// 3 minutes across the 48 hours following local midnight on two
+// reference days in the America/Toronto zone.
+func (*activityPeriodSuite) TestPeriod(c *check.C) {
+       toronto, err := time.LoadLocation("America/Toronto")
+       c.Assert(err, check.IsNil)
+
+       format := "2006-01-02 15:04:05 MST"
+       // Reference days, as named: the 2022 dates on which DST
+       // starts and ends.
+       dststartday, err := time.ParseInLocation(format, "2022-03-13 00:00:00 EST", toronto)
+       c.Assert(err, check.IsNil)
+       dstendday, err := time.ParseInLocation(format, "2022-11-06 00:00:00 EDT", toronto)
+       c.Assert(err, check.IsNil)
+
+       for _, period := range []time.Duration{
+               time.Minute * 13,
+               time.Minute * 49,
+               time.Hour,
+               4 * time.Hour,
+               48 * time.Hour,
+       } {
+               for offset := time.Duration(0); offset < 48*time.Hour; offset += 3 * time.Minute {
+                       t := dststartday.Add(offset)
+                       end := alignedPeriod(t, period)
+                       c.Check(end.After(t), check.Equals, true, check.Commentf("period %v offset %v", period, offset))
+
+                       t = dstendday.Add(offset)
+                       end = alignedPeriod(t, period)
+                       c.Check(end.After(t), check.Equals, true, check.Commentf("period %v offset %v", period, offset))
+               }
+       }
+}
+
+// TestLogActivity creates two collections as the active user and
+// checks that the first call results in a row in the logs table for
+// that user, while the second call does not add another one.
+func (s *CollectionSuite) TestLogActivity(c *check.C) {
+       starttime := time.Now()
+       // Set the period end to "now" so that it is (presumably) in
+       // the past by the time of the first API call below, making
+       // logActivity start a fresh period.
+       s.localdb.activeUsersLock.Lock()
+       s.localdb.activeUsersReset = starttime
+       s.localdb.activeUsersLock.Unlock()
+       db := arvadostest.DB(c, s.cluster)
+       wrap := api.ComposeWrappers(
+               ctrlctx.WrapCallsInTransactions(func(ctx context.Context) (*sqlx.DB, error) { return db, nil }),
+               ctrlctx.WrapCallsWithAuth(s.cluster))
+       collectionCreate := wrap(func(ctx context.Context, opts interface{}) (interface{}, error) {
+               return s.localdb.CollectionCreate(ctx, opts.(arvados.CreateOptions))
+       })
+       ctx := auth.NewContext(context.Background(), &auth.Credentials{Tokens: []string{arvadostest.ActiveTokenV2}})
+       for i := 0; i < 2; i++ {
+               // Only log rows newer than this iteration's start
+               // are considered.
+               logthreshold := time.Now()
+               _, err := collectionCreate(ctx, arvados.CreateOptions{
+                       Attrs: map[string]interface{}{
+                               "name": "test collection",
+                       },
+                       EnsureUniqueName: true,
+               })
+               c.Assert(err, check.IsNil)
+               var uuid string
+               err = db.QueryRowContext(ctx, `select uuid from logs where object_uuid = $1 and event_at > $2`, arvadostest.ActiveUserUUID, logthreshold.UTC()).Scan(&uuid)
+               if i == 0 {
+                       // First call in the period: a log row exists.
+                       c.Check(err, check.IsNil)
+                       c.Check(uuid, check.HasLen, 27)
+               } else {
+                       // Second call in the same period: nothing new.
+                       c.Check(err, check.Equals, sql.ErrNoRows)
+               }
+       }
+}
diff --git a/lib/controller/localdb/login.go b/lib/controller/localdb/login.go

index 2b20491a04a426f50dbb354b9c8e0a7e86f833ea..a1ac2c55b02657462ce1c78d860df4a4fdc94186 100644 (file)
--- a/lib/controller/localdb/login.go
+++ b/lib/controller/localdb/login.go
@@ -10,6 +10,7 @@ import (
         "encoding/json"
         "errors"
         "fmt"
+       "net"
         "net/http"
         "net/url"
         "strings"
@@ -162,3 +163,39 @@ func (conn *Conn) CreateAPIClientAuthorization(ctx context.Context, rootToken st
         }
         return
  }
+
+// validateLoginRedirectTarget returns nil if returnTo is an
+// acceptable redirect target for the given cluster config, and a
+// non-nil error otherwise (including when returnTo cannot be
+// parsed).
+//
+// The path of returnTo is ignored: the URL is reduced to its root
+// ("/") before any comparison. A target is accepted if
+//
+//   - it is a key in cluster.Login.TrustedClients, or
+//   - it equals the Workbench1 or Workbench2 ExternalURL, or
+//   - cluster.Login.TrustPrivateNetworks is set and its hostname is
+//     "localhost" or an IP address contained in one of the
+//     privateNetworks entries (declared outside this function).
+func validateLoginRedirectTarget(cluster *arvados.Cluster, returnTo string) error {
+       u, err := url.Parse(returnTo)
+       if err != nil {
+               return err
+       }
+       // Replace whatever path was given with "/".
+       u, err = u.Parse("/")
+       if err != nil {
+               return err
+       }
+       // Drop an explicit port when it is the default for the
+       // scheme, so "https://host:443/" compares equal to
+       // "https://host/".
+       if u.Port() == "80" && u.Scheme == "http" {
+               u.Host = u.Hostname()
+       } else if u.Port() == "443" && u.Scheme == "https" {
+               u.Host = u.Hostname()
+       }
+       if _, ok := cluster.Login.TrustedClients[arvados.URL(*u)]; ok {
+               return nil
+       }
+       if u.String() == cluster.Services.Workbench1.ExternalURL.String() ||
+               u.String() == cluster.Services.Workbench2.ExternalURL.String() {
+               return nil
+       }
+       if cluster.Login.TrustPrivateNetworks {
+               // Note the scheme and port are not checked here.
+               if u.Hostname() == "localhost" {
+                       return nil
+               }
+               if ip := net.ParseIP(u.Hostname()); len(ip) > 0 {
+                       for _, n := range privateNetworks {
+                               if n.Contains(ip) {
+                                       return nil
+                               }
+                       }
+               }
+       }
+       return fmt.Errorf("requesting site is not listed in TrustedClients config")
+}
diff --git a/lib/controller/localdb/login_oidc.go b/lib/controller/localdb/login_oidc.go

index 6d6f80f39c70ac5427578ddd6ed5eb3e78b6a136..05e5e243b99d574fa4956e41cfcaee8c24cbe5ab 100644 (file)
--- a/lib/controller/localdb/login_oidc.go
+++ b/lib/controller/localdb/login_oidc.go
@@ -116,6 +116,9 @@ func (ctrl *oidcLoginController) Login(ctx context.Context, opts arvados.LoginOp
                 if opts.ReturnTo == "" {
                         return loginError(errors.New("missing return_to parameter"))
                 }
+               if err := validateLoginRedirectTarget(ctrl.Parent.cluster, opts.ReturnTo); err != nil {
+                       return loginError(fmt.Errorf("invalid return_to parameter: %s", err))
+               }
                 state := ctrl.newOAuth2State([]byte(ctrl.Cluster.SystemRootToken), opts.Remote, opts.ReturnTo)
                 var authparams []oauth2.AuthCodeOption
                 for k, v := range ctrl.AuthParams {
diff --git a/lib/controller/localdb/login_oidc_test.go b/lib/controller/localdb/login_oidc_test.go

index b9f0f56e058482eb74eb527b038136e56979feff..0fe3bdf7f6b684652cad9c71f3c0a63fba15b925 100644 (file)
--- a/lib/controller/localdb/login_oidc_test.go
+++ b/lib/controller/localdb/login_oidc_test.go
@@ -42,6 +42,7 @@ type OIDCLoginSuite struct {
         cluster      *arvados.Cluster
         localdb      *Conn
         railsSpy     *arvadostest.Proxy
+       trustedURL   *arvados.URL
         fakeProvider *arvadostest.OIDCProvider
  }
  
@@ -53,6 +54,8 @@ func (s *OIDCLoginSuite) TearDownSuite(c *check.C) {
  }
  
  func (s *OIDCLoginSuite) SetUpTest(c *check.C) {
+       s.trustedURL = &arvados.URL{Scheme: "https", Host: "app.example.com", Path: "/"}
+
         s.fakeProvider = arvadostest.NewOIDCProvider(c)
         s.fakeProvider.AuthEmail = "active-user@arvados.local"
         s.fakeProvider.AuthEmailVerified = true
@@ -70,6 +73,7 @@ func (s *OIDCLoginSuite) SetUpTest(c *check.C) {
         s.cluster.Login.Google.Enable = true
         s.cluster.Login.Google.ClientID = "test%client$id"
         s.cluster.Login.Google.ClientSecret = "test#client/secret"
+       s.cluster.Login.TrustedClients = map[arvados.URL]struct{}{*s.trustedURL: {}}
         s.cluster.Users.PreferDomainForUsername = "PreferDomainForUsername.example.com"
         s.fakeProvider.ValidClientID = "test%client$id"
         s.fakeProvider.ValidClientSecret = "test#client/secret"
@@ -88,9 +92,26 @@ func (s *OIDCLoginSuite) TearDownTest(c *check.C) {
  }
  
  func (s *OIDCLoginSuite) TestGoogleLogout(c *check.C) {
+       s.cluster.Login.TrustedClients[arvados.URL{Scheme: "https", Host: "foo.example", Path: "/"}] = struct{}{}
+       s.cluster.Login.TrustPrivateNetworks = false
+
         resp, err := s.localdb.Logout(context.Background(), arvados.LogoutOptions{ReturnTo: "https://foo.example.com/bar"})
+       c.Check(err, check.NotNil)
+       c.Check(resp.RedirectLocation, check.Equals, "")
+
+       resp, err = s.localdb.Logout(context.Background(), arvados.LogoutOptions{ReturnTo: "https://127.0.0.1/bar"})
+       c.Check(err, check.NotNil)
+       c.Check(resp.RedirectLocation, check.Equals, "")
+
+       resp, err = s.localdb.Logout(context.Background(), arvados.LogoutOptions{ReturnTo: "https://foo.example/bar"})
+       c.Check(err, check.IsNil)
+       c.Check(resp.RedirectLocation, check.Equals, "https://foo.example/bar")
+
+       s.cluster.Login.TrustPrivateNetworks = true
+
+       resp, err = s.localdb.Logout(context.Background(), arvados.LogoutOptions{ReturnTo: "https://192.168.1.1/bar"})
         c.Check(err, check.IsNil)
-       c.Check(resp.RedirectLocation, check.Equals, "https://foo.example.com/bar")
+       c.Check(resp.RedirectLocation, check.Equals, "https://192.168.1.1/bar")
  }
  
  func (s *OIDCLoginSuite) TestGoogleLogin_Start_Bogus(c *check.C) {
@@ -118,6 +139,13 @@ func (s *OIDCLoginSuite) TestGoogleLogin_Start(c *check.C) {
         }
  }
  
+// TestGoogleLogin_UnknownClient checks that starting a login with a
+// return_to URL that is not a trusted client produces no redirect,
+// and that the TrustedClients error is reported in the HTML response
+// rather than as a Go error.
+func (s *OIDCLoginSuite) TestGoogleLogin_UnknownClient(c *check.C) {
+       resp, err := s.localdb.Login(context.Background(), arvados.LoginOptions{ReturnTo: "https://bad-app.example.com/foo?bar"})
+       c.Check(err, check.IsNil)
+       c.Check(resp.RedirectLocation, check.Equals, "")
+       c.Check(resp.HTML.String(), check.Matches, `(?ms).*requesting site is not listed in TrustedClients.*`)
+}
+
  func (s *OIDCLoginSuite) TestGoogleLogin_InvalidCode(c *check.C) {
         state := s.startLogin(c)
         resp, err := s.localdb.Login(context.Background(), arvados.LoginOptions{
@@ -613,10 +641,14 @@ func (s *OIDCLoginSuite) startLogin(c *check.C, checks ...func(url.Values)) (sta
         // the provider, just grab state from the redirect URL.
         resp, err := s.localdb.Login(context.Background(), arvados.LoginOptions{ReturnTo: "https://app.example.com/foo?bar"})
         c.Check(err, check.IsNil)
+       c.Check(resp.HTML.String(), check.Not(check.Matches), `(?ms).*error:.*`)
         target, err := url.Parse(resp.RedirectLocation)
         c.Check(err, check.IsNil)
         state = target.Query().Get("state")
-       c.Check(state, check.Not(check.Equals), "")
+       if !c.Check(state, check.Not(check.Equals), "") {
+               c.Logf("Redirect target: %q", target)
+               c.Logf("HTML: %q", resp.HTML)
+       }
         for _, fn := range checks {
                 fn(target.Query())
         }
@@ -624,6 +656,56 @@ func (s *OIDCLoginSuite) startLogin(c *check.C, checks ...func(url.Values)) (sta
         return
  }
  
+// TestValidateLoginRedirectTarget runs validateLoginRedirectTarget
+// against a table of URLs. Each trial sets TrustPrivateNetworks to
+// trustPrivate and expects a nil error exactly when permit is true.
+func (s *OIDCLoginSuite) TestValidateLoginRedirectTarget(c *check.C) {
+       for _, trial := range []struct {
+               permit       bool
+               trustPrivate bool
+               url          string
+       }{
+               // wb1, wb2 => accept
+               {true, false, s.cluster.Services.Workbench1.ExternalURL.String()},
+               {true, false, s.cluster.Services.Workbench2.ExternalURL.String()},
+               // explicitly listed host => accept
+               {true, false, "https://app.example.com/"},
+               {true, false, "https://app.example.com:443/foo?bar=baz"},
+               // non-listed hostname => deny (regardless of TrustPrivateNetworks)
+               {false, false, "https://bad.example/"},
+               {false, true, "https://bad.example/"},
+               // non-listed non-private IP addr => deny (regardless of TrustPrivateNetworks)
+               {false, false, "https://1.2.3.4/"},
+               {false, true, "https://1.2.3.4/"},
+               {false, true, "https://[ab::cd]:1234/"},
+               // localhost or non-listed private IP addr => accept only if TrustPrivateNetworks is set
+               {false, false, "https://localhost/"},
+               {true, true, "https://localhost/"},
+               {false, false, "https://[10.9.8.7]:80/foo"},
+               {true, true, "https://[10.9.8.7]:80/foo"},
+               {false, false, "https://[::1]:80/foo"},
+               {true, true, "https://[::1]:80/foo"},
+               {true, true, "http://192.168.1.1/"},
+               {true, true, "http://172.17.2.0/"},
+               // bad url => deny
+               {false, true, "https://10.1.1.1:blorp/foo"},        // non-numeric port
+               {false, true, "https://app.example.com:blorp/foo"}, // non-numeric port
+               {false, true, "https://]:443"},
+               {false, true, "https://"},
+               {false, true, "https:"},
+               {false, true, ""},
+               // explicitly listed host but different port, protocol, or user/pass => deny
+               {false, true, "http://app.example.com/"},
+               {false, true, "http://app.example.com:443/"},
+               {false, true, "https://app.example.com:80/"},
+               {false, true, "https://app.example.com:4433/"},
+               {false, true, "https://u:p@app.example.com:443/foo?bar=baz"},
+       } {
+               c.Logf("trial %+v", trial)
+               s.cluster.Login.TrustPrivateNetworks = trial.trustPrivate
+               err := validateLoginRedirectTarget(s.cluster, trial.url)
+               c.Check(err == nil, check.Equals, trial.permit)
+       }
+
+}
+
  func getCallbackAuthInfo(c *check.C, railsSpy *arvadostest.Proxy) (authinfo rpc.UserSessionAuthInfo) {
         for _, dump := range railsSpy.RequestDumps {
                 c.Logf("spied request: %q", dump)
diff --git a/lib/controller/localdb/login_testuser_test.go b/lib/controller/localdb/login_testuser_test.go

index 51c2416f59bcb7c2c7f55e9425489ae003653ee5..8717617889bcd8d8fbf5a3e8e43c4d6852834a70 100644 (file)
--- a/lib/controller/localdb/login_testuser_test.go
+++ b/lib/controller/localdb/login_testuser_test.go
@@ -103,7 +103,8 @@ func (s *TestUserSuite) TestLoginForm(c *check.C) {
  }
  
  func (s *TestUserSuite) TestExpireTokenOnLogout(c *check.C) {
-       returnTo := "https://localhost:12345/logout"
+       s.cluster.Login.TrustPrivateNetworks = true
+       returnTo := "https://[::1]:12345/logout"
         for _, trial := range []struct {
                 requestToken      string
                 expiringTokenUUID string
diff --git a/lib/controller/localdb/logout.go b/lib/controller/localdb/logout.go

index e1603f14485eb0a4f664a2a00b080a1497c64d2a..04e7681ad7bef728bb11e5c745c2b8391094b2d5 100644 (file)
--- a/lib/controller/localdb/logout.go
+++ b/lib/controller/localdb/logout.go
@@ -33,6 +33,8 @@ func logout(ctx context.Context, cluster *arvados.Cluster, opts arvados.LogoutOp
                 } else {
                         target = cluster.Services.Workbench1.ExternalURL.String()
                 }
+       } else if err := validateLoginRedirectTarget(cluster, target); err != nil {
+               return arvados.LogoutResponse{}, httpserver.ErrorWithStatus(fmt.Errorf("invalid return_to parameter: %s", err), http.StatusBadRequest)
         }
         return arvados.LogoutResponse{RedirectLocation: target}, nil
  }
diff --git a/lib/controller/router/router.go b/lib/controller/router/router.go

index 80d5e929850cd18df389daeddb18eb4b12387a38..d4712558eae07c8ddd2a369ae40e8ce4ba55da0c 100644 (file)
--- a/lib/controller/router/router.go
+++ b/lib/controller/router/router.go
@@ -367,6 +367,41 @@ func (rtr *router) addRoutes() {
                                 return rtr.backend.LinkDelete(ctx, *opts.(*arvados.DeleteOptions))
                         },
                 },
+               {
+                       arvados.EndpointLogCreate,
+                       func() interface{} { return &arvados.CreateOptions{} },
+                       func(ctx context.Context, opts interface{}) (interface{}, error) {
+                               return rtr.backend.LogCreate(ctx, *opts.(*arvados.CreateOptions))
+                       },
+               },
+               {
+                       arvados.EndpointLogUpdate,
+                       func() interface{} { return &arvados.UpdateOptions{} },
+                       func(ctx context.Context, opts interface{}) (interface{}, error) {
+                               return rtr.backend.LogUpdate(ctx, *opts.(*arvados.UpdateOptions))
+                       },
+               },
+               {
+                       arvados.EndpointLogList,
+                       func() interface{} { return &arvados.ListOptions{Limit: -1} },
+                       func(ctx context.Context, opts interface{}) (interface{}, error) {
+                               return rtr.backend.LogList(ctx, *opts.(*arvados.ListOptions))
+                       },
+               },
+               {
+                       arvados.EndpointLogGet,
+                       func() interface{} { return &arvados.GetOptions{} },
+                       func(ctx context.Context, opts interface{}) (interface{}, error) {
+                               return rtr.backend.LogGet(ctx, *opts.(*arvados.GetOptions))
+                       },
+               },
+               {
+                       arvados.EndpointLogDelete,
+                       func() interface{} { return &arvados.DeleteOptions{} },
+                       func(ctx context.Context, opts interface{}) (interface{}, error) {
+                               return rtr.backend.LogDelete(ctx, *opts.(*arvados.DeleteOptions))
+                       },
+               },
                 {
                         arvados.EndpointSpecimenCreate,
                         func() interface{} { return &arvados.CreateOptions{} },
diff --git a/lib/controller/rpc/conn.go b/lib/controller/rpc/conn.go

index 0e532f23c070d8b5c64a15bd8bef46494702ae5a..4d8a82ce43ef6b5a3f47d100f509ebd03895c43d 100644 (file)
--- a/lib/controller/rpc/conn.go
+++ b/lib/controller/rpc/conn.go
@@ -559,6 +559,41 @@ func (conn *Conn) LinkDelete(ctx context.Context, options arvados.DeleteOptions)
         return resp, err
  }
  
+// LogCreate sends options to the EndpointLogCreate endpoint and
+// decodes the response into an arvados.Log.
+func (conn *Conn) LogCreate(ctx context.Context, options arvados.CreateOptions) (arvados.Log, error) {
+       ep := arvados.EndpointLogCreate
+       var resp arvados.Log
+       err := conn.requestAndDecode(ctx, &resp, ep, nil, options)
+       return resp, err
+}
+
+// LogUpdate sends options to the EndpointLogUpdate endpoint and
+// decodes the response into an arvados.Log.
+func (conn *Conn) LogUpdate(ctx context.Context, options arvados.UpdateOptions) (arvados.Log, error) {
+       ep := arvados.EndpointLogUpdate
+       var resp arvados.Log
+       err := conn.requestAndDecode(ctx, &resp, ep, nil, options)
+       return resp, err
+}
+
+// LogGet sends options to the EndpointLogGet endpoint and decodes
+// the response into an arvados.Log.
+func (conn *Conn) LogGet(ctx context.Context, options arvados.GetOptions) (arvados.Log, error) {
+       ep := arvados.EndpointLogGet
+       var resp arvados.Log
+       err := conn.requestAndDecode(ctx, &resp, ep, nil, options)
+       return resp, err
+}
+
+// LogList sends options to the EndpointLogList endpoint and decodes
+// the response into an arvados.LogList.
+func (conn *Conn) LogList(ctx context.Context, options arvados.ListOptions) (arvados.LogList, error) {
+       ep := arvados.EndpointLogList
+       var resp arvados.LogList
+       err := conn.requestAndDecode(ctx, &resp, ep, nil, options)
+       return resp, err
+}
+
+// LogDelete sends options to the EndpointLogDelete endpoint and
+// decodes the response into an arvados.Log.
+func (conn *Conn) LogDelete(ctx context.Context, options arvados.DeleteOptions) (arvados.Log, error) {
+       ep := arvados.EndpointLogDelete
+       var resp arvados.Log
+       err := conn.requestAndDecode(ctx, &resp, ep, nil, options)
+       return resp, err
+}
+
  func (conn *Conn) SpecimenCreate(ctx context.Context, options arvados.CreateOptions) (arvados.Specimen, error) {
         ep := arvados.EndpointSpecimenCreate
         var resp arvados.Specimen
diff --git a/lib/controller/trash.go b/lib/controller/trash.go

index 551b2f92bbde209b984656728388ca48a2b9c294..99e7aec0b66c4dbed9462c498ece37e38971157b 100644 (file)
--- a/lib/controller/trash.go
+++ b/lib/controller/trash.go
@@ -5,6 +5,7 @@
  package controller
  
  import (
+       "context"
         "time"
  
         "git.arvados.org/arvados.git/lib/controller/dblock"
@@ -12,22 +13,62 @@ import (
         "git.arvados.org/arvados.git/sdk/go/ctxlog"
  )
  
-func (h *Handler) trashSweepWorker() {
-       sleep := h.Cluster.Collections.TrashSweepInterval.Duration()
-       logger := ctxlog.FromContext(h.BackgroundContext).WithField("worker", "trash sweep")
+func (h *Handler) periodicWorker(workerName string, interval time.Duration, locker *dblock.DBLocker, run func(context.Context) error) {
+       logger := ctxlog.FromContext(h.BackgroundContext).WithField("worker", workerName)
         ctx := ctxlog.Context(h.BackgroundContext, logger)
-       if sleep <= 0 {
-               logger.Debugf("Collections.TrashSweepInterval is %v, not running worker", sleep)
+       if interval <= 0 {
+               logger.Debugf("interval is %v, not running worker", interval)
                 return
         }
-       dblock.TrashSweep.Lock(ctx, h.db)
-       defer dblock.TrashSweep.Unlock()
-       for time.Sleep(sleep); ctx.Err() == nil; time.Sleep(sleep) {
-               dblock.TrashSweep.Check()
-               ctx := auth.NewContext(ctx, &auth.Credentials{Tokens: []string{h.Cluster.SystemRootToken}})
-               _, err := h.federation.SysTrashSweep(ctx, struct{}{})
+       if !locker.Lock(ctx, h.dbConnector.GetDB) {
+               // context canceled
+               return
+       }
+       defer locker.Unlock()
+       for time.Sleep(interval); ctx.Err() == nil; time.Sleep(interval) {
+               if !locker.Check() {
+                       // context canceled
+                       return
+               }
+               err := run(ctx)
                 if err != nil {
-                       logger.WithError(err).Info("trash sweep failed")
+                       logger.WithError(err).Infof("%s failed", workerName)
                 }
         }
  }
+
+// trashSweepWorker uses periodicWorker to call SysTrashSweep on
+// h.federation every Collections.TrashSweepInterval, under the
+// dblock.TrashSweep lock, authenticating with the cluster's
+// SystemRootToken.
+func (h *Handler) trashSweepWorker() {
+       h.periodicWorker("trash sweep", h.Cluster.Collections.TrashSweepInterval.Duration(), dblock.TrashSweep, func(ctx context.Context) error {
+               ctx = auth.NewContext(ctx, &auth.Credentials{Tokens: []string{h.Cluster.SystemRootToken}})
+               _, err := h.federation.SysTrashSweep(ctx, struct{}{})
+               return err
+       })
+}
+
+// containerLogSweepWorker uses periodicWorker to delete old
+// container log rows from the logs table every
+// Containers.Logging.SweepInterval, under the
+// dblock.ContainerLogSweep lock.
+//
+// A row is deleted when its event_type is one of the listed
+// container-related types, and it refers to a container whose log
+// field is not null and which finished longer ago than
+// Containers.Logging.MaxAge.
+func (h *Handler) containerLogSweepWorker() {
+       h.periodicWorker("container log sweep", h.Cluster.Containers.Logging.SweepInterval.Duration(), dblock.ContainerLogSweep, func(ctx context.Context) error {
+               db, err := h.dbConnector.GetDB(ctx)
+               if err != nil {
+                       return err
+               }
+               res, err := db.ExecContext(ctx, `
+DELETE FROM logs
+ USING containers
+ WHERE logs.object_uuid=containers.uuid
+ AND logs.event_type in ('stdout', 'stderr', 'arv-mount', 'crunch-run', 'crunchstat', 'hoststat', 'node', 'container', 'keepstore')
+ AND containers.log IS NOT NULL
+ AND now() - containers.finished_at > $1::interval`,
+                       h.Cluster.Containers.Logging.MaxAge.String())
+               if err != nil {
+                       return err
+               }
+               logger := ctxlog.FromContext(ctx)
+               rows, err := res.RowsAffected()
+               // Failing to get the row count is only reported; the
+               // sweep itself is still treated as successful.
+               if err != nil {
+                       logger.WithError(err).Warn("unexpected error from RowsAffected()")
+               } else {
+                       logger.WithField("rows", rows).Info("deleted rows from logs table")
+               }
+               return nil
+       })
+}
diff --git a/lib/crunchrun/crunchrun.go b/lib/crunchrun/crunchrun.go

index ee9115d8d809903be17cbaa10dc4010d1b7d87dc..51e154c0ecfb3b978844947480f1efe7fe2f6fa9 100644 (file)
--- a/lib/crunchrun/crunchrun.go
+++ b/lib/crunchrun/crunchrun.go
@@ -142,6 +142,7 @@ type ContainerRunner struct {
         parentTemp    string
         costStartTime time.Time
  
+       keepstore        *exec.Cmd
         keepstoreLogger  io.WriteCloser
         keepstoreLogbuf  *bufThenWrite
         statLogger       io.WriteCloser
@@ -427,7 +428,13 @@ func (runner *ContainerRunner) SetupMounts() (map[string]bindmount, error) {
                 arvMountCmd = append(arvMountCmd, "--allow-other")
         }
  
-       if runner.Container.RuntimeConstraints.KeepCacheRAM > 0 {
+       if runner.Container.RuntimeConstraints.KeepCacheDisk > 0 {
+               keepcachedir, err := runner.MkTempDir(runner.parentTemp, "keepcache")
+               if err != nil {
+                       return nil, fmt.Errorf("while creating keep cache temp dir: %v", err)
+               }
+               arvMountCmd = append(arvMountCmd, "--disk-cache", "--disk-cache-dir", keepcachedir, "--file-cache", fmt.Sprintf("%d", runner.Container.RuntimeConstraints.KeepCacheDisk))
+       } else if runner.Container.RuntimeConstraints.KeepCacheRAM > 0 {
                 arvMountCmd = append(arvMountCmd, "--file-cache", fmt.Sprintf("%d", runner.Container.RuntimeConstraints.KeepCacheRAM))
         }
  
@@ -660,6 +667,9 @@ func (runner *ContainerRunner) SetupMounts() (map[string]bindmount, error) {
         if err != nil {
                 return nil, fmt.Errorf("while trying to start arv-mount: %v", err)
         }
+       if runner.hoststatReporter != nil && runner.ArvMount != nil {
+               runner.hoststatReporter.ReportPID("arv-mount", runner.ArvMount.Process.Pid)
+       }
  
         for _, p := range collectionPaths {
                 _, err = os.Stat(p)
@@ -733,6 +743,7 @@ func (runner *ContainerRunner) startHoststat() error {
                 PollPeriod: runner.statInterval,
         }
         runner.hoststatReporter.Start()
+       runner.hoststatReporter.ReportPID("crunch-run", os.Getpid())
         return nil
  }
  
@@ -1569,6 +1580,9 @@ func (runner *ContainerRunner) Run() (err error) {
         if err != nil {
                 return
         }
+       if runner.keepstore != nil {
+               runner.hoststatReporter.ReportPID("keepstore", runner.keepstore.Process.Pid)
+       }
  
         // set up FUSE mount and binds
         bindmounts, err = runner.SetupMounts()
@@ -1853,6 +1867,7 @@ func (command) RunCommand(prog string, args []string, stdin io.Reader, stdout, s
                 return 1
         }
  
+       cr.keepstore = keepstore
         if keepstore == nil {
                 // Log explanation (if any) for why we're not running
                 // a local keepstore.
diff --git a/lib/crunchstat/crunchstat.go b/lib/crunchstat/crunchstat.go

index 10cd7cfce43a03472e2e942b68512efcdd7d0c61..3a473cab8715c49eec14d5e0565b61daf9d71a5e 100644 (file)
--- a/lib/crunchstat/crunchstat.go
+++ b/lib/crunchstat/crunchstat.go
@@ -13,10 +13,12 @@ import (
         "fmt"
         "io"
         "io/ioutil"
-       "log"
         "os"
+       "regexp"
+       "sort"
         "strconv"
         "strings"
+       "sync"
         "syscall"
         "time"
  )
@@ -47,14 +49,20 @@ type Reporter struct {
         TempDir string
  
         // Where to write statistics. Must not be nil.
-       Logger *log.Logger
+       Logger interface {
+               Printf(fmt string, args ...interface{})
+       }
  
+       kernelPageSize      int64
         reportedStatFile    map[string]string
         lastNetSample       map[string]ioSample
         lastDiskIOSample    map[string]ioSample
         lastCPUSample       cpuSample
         lastDiskSpaceSample diskSpaceSample
  
+       reportPIDs   map[string]int
+       reportPIDsMu sync.Mutex
+
         done    chan struct{} // closed when we should stop reporting
         flushed chan struct{} // closed when we have made our last report
  }
@@ -76,6 +84,17 @@ func (r *Reporter) Start() {
         go r.run()
  }
  
+// ReportPID registers a process, under the given name, whose stats
+// are included in subsequent reports. Registering the same name
+// again replaces the previously registered pid.
+func (r *Reporter) ReportPID(name string, pid int) {
+       r.reportPIDsMu.Lock()
+       defer r.reportPIDsMu.Unlock()
+       if r.reportPIDs == nil {
+               r.reportPIDs = make(map[string]int)
+       }
+       r.reportPIDs[name] = pid
+}
+
  // Stop reporting. Do not call more than once, or before calling
  // Start.
  //
@@ -256,6 +275,71 @@ func (r *Reporter) doMemoryStats() {
                 }
         }
         r.Logger.Printf("mem%s\n", outstat.String())
+
+       if r.kernelPageSize == 0 {
+               // assign "don't try again" value in case we give up
+               // and return without assigning the real value
+               r.kernelPageSize = -1
+               buf, err := os.ReadFile("/proc/self/smaps")
+               if err != nil {
+                       r.Logger.Printf("error reading /proc/self/smaps: %s", err)
+                       return
+               }
+               m := regexp.MustCompile(`\nKernelPageSize:\s*(\d+) kB\n`).FindSubmatch(buf)
+               if len(m) != 2 {
+                       r.Logger.Printf("error parsing /proc/self/smaps: KernelPageSize not found")
+                       return
+               }
+               size, err := strconv.ParseInt(string(m[1]), 10, 64)
+               if err != nil {
+                       r.Logger.Printf("error parsing /proc/self/smaps: KernelPageSize %q: %s", m[1], err)
+                       return
+               }
+               r.kernelPageSize = size * 1024
+       } else if r.kernelPageSize < 0 {
+               // already failed to determine page size, don't keep
+               // trying/logging
+               return
+       }
+
+       r.reportPIDsMu.Lock()
+       defer r.reportPIDsMu.Unlock()
+       procnames := make([]string, 0, len(r.reportPIDs))
+       for name := range r.reportPIDs {
+               procnames = append(procnames, name)
+       }
+       sort.Strings(procnames)
+       procmem := ""
+       for _, procname := range procnames {
+               pid := r.reportPIDs[procname]
+               buf, err := os.ReadFile(fmt.Sprintf("/proc/%d/stat", pid))
+               if err != nil {
+                       continue
+               }
+               // If the executable name contains a ')' char,
+               // /proc/$pid/stat will look like '1234 (exec name)) S
+               // 123 ...' -- the last ')' is the end of the 2nd
+               // field.
+               paren := bytes.LastIndexByte(buf, ')')
+               if paren < 0 {
+                       continue
+               }
+               fields := bytes.SplitN(buf[paren:], []byte{' '}, 24)
+               if len(fields) < 24 {
+                       continue
+               }
+               // rss is the 24th field in .../stat, and fields[0]
+               // here is the last char ')' of the 2nd field, so
+               // rss is fields[22]
+               rss, err := strconv.ParseInt(string(fields[22]), 10, 64)
+               if err != nil {
+                       continue
+               }
+               procmem += fmt.Sprintf(" %d %s", rss*r.kernelPageSize, procname)
+       }
+       if procmem != "" {
+               r.Logger.Printf("procmem%s\n", procmem)
+       }
  }
  
  func (r *Reporter) doNetworkStats() {
diff --git a/lib/crunchstat/crunchstat_test.go b/lib/crunchstat/crunchstat_test.go

index c27e39241df08af2c925a791e6fd849afc496b90..5e8e93de6cfae9ce3f51c7b191e515ff8e7d9955 100644 (file)
--- a/lib/crunchstat/crunchstat_test.go
+++ b/lib/crunchstat/crunchstat_test.go
@@ -5,62 +5,81 @@
  package crunchstat
  
  import (
-       "bufio"
-       "io"
+       "bytes"
         "log"
         "os"
         "regexp"
+       "strconv"
         "testing"
+       "time"
+
+       "github.com/sirupsen/logrus"
+       . "gopkg.in/check.v1"
  )
  
-func bufLogger() (*log.Logger, *bufio.Reader) {
-       r, w := io.Pipe()
-       logger := log.New(w, "", 0)
-       return logger, bufio.NewReader(r)
+func Test(t *testing.T) {
+       TestingT(t)
  }
  
-func TestReadAllOrWarnFail(t *testing.T) {
-       logger, rcv := bufLogger()
-       rep := Reporter{Logger: logger}
+var _ = Suite(&suite{})
  
-       done := make(chan bool)
-       var msg []byte
-       var err error
-       go func() {
-               msg, err = rcv.ReadBytes('\n')
-               close(done)
-       }()
-       {
-               // The special file /proc/self/mem can be opened for
-               // reading, but reading from byte 0 returns an error.
-               f, err := os.Open("/proc/self/mem")
-               if err != nil {
-                       t.Fatalf("Opening /proc/self/mem: %s", err)
-               }
-               if x, err := rep.readAllOrWarn(f); err == nil {
-                       t.Fatalf("Expected error, got %v", x)
-               }
-       }
-       <-done
-       if err != nil {
-               t.Fatal(err)
-       } else if matched, err := regexp.MatchString("^warning: read /proc/self/mem: .*", string(msg)); err != nil || !matched {
-               t.Fatalf("Expected error message about unreadable file, got \"%s\"", msg)
-       }
+type suite struct{}
+
+// TestReadAllOrWarnFail checks that readAllOrWarn returns an error
+// and logs a warning when reading the file fails.
+func (s *suite) TestReadAllOrWarnFail(c *C) {
+       var logbuf bytes.Buffer
+       rep := Reporter{Logger: log.New(&logbuf, "", 0)}
+
+       // The special file /proc/self/mem can be opened for
+       // reading, but reading from byte 0 returns an error.
+       memfile, openErr := os.Open("/proc/self/mem")
+       c.Assert(openErr, IsNil)
+       defer memfile.Close()
+       _, readErr := rep.readAllOrWarn(memfile)
+       c.Check(readErr, NotNil)
+       c.Check(logbuf.String(), Matches, "^warning: read /proc/self/mem: .*\n")
+}
  
-func TestReadAllOrWarnSuccess(t *testing.T) {
-       rep := Reporter{Logger: log.New(os.Stderr, "", 0)}
+func (s *suite) TestReadAllOrWarnSuccess(c *C) {
+       var logbuf bytes.Buffer
+       rep := Reporter{Logger: log.New(&logbuf, "", 0)}
  
         f, err := os.Open("./crunchstat_test.go")
-       if err != nil {
-               t.Fatalf("Opening ./crunchstat_test.go: %s", err)
-       }
+       c.Assert(err, IsNil)
+       defer f.Close()
         data, err := rep.readAllOrWarn(f)
-       if err != nil {
-               t.Fatalf("got error %s", err)
+       c.Check(err, IsNil)
+       c.Check(string(data), Matches, "(?ms).*\npackage crunchstat\n.*")
+       c.Check(logbuf.String(), Equals, "")
+}
+
+func (s *suite) TestReportPIDs(c *C) {
+       var logbuf bytes.Buffer
+       logger := logrus.New()
+       logger.Out = &logbuf
+       r := Reporter{
+               Logger:     logger,
+               CgroupRoot: "/sys/fs/cgroup",
+               PollPeriod: time.Second,
         }
-       if matched, err := regexp.MatchString("\npackage crunchstat\n", string(data)); err != nil || !matched {
-               t.Fatalf("data failed regexp: err %v, matched %v", err, matched)
+       r.Start()
+       r.ReportPID("init", 1)
+       r.ReportPID("test_process", os.Getpid())
+       r.ReportPID("nonexistent", 12345) // should be silently ignored/omitted
+       for deadline := time.Now().Add(10 * time.Second); ; time.Sleep(time.Millisecond) {
+               if time.Now().After(deadline) {
+                       c.Error("timed out")
+                       break
+               }
+               if m := regexp.MustCompile(`(?ms).*procmem \d+ init (\d+) test_process.*`).FindSubmatch(logbuf.Bytes()); len(m) > 0 {
+                       size, err := strconv.ParseInt(string(m[1]), 10, 64)
+                       c.Check(err, IsNil)
+                       // Expect >1 MiB and <100 MiB -- otherwise we
+                       // are probably misinterpreting /proc/N/stat
+                       // or multiplying by the wrong page size.
+                       c.Check(size > 1000000, Equals, true)
+                       c.Check(size < 100000000, Equals, true)
+                       break
+               }
         }
+       c.Logf("%s", logbuf.String())
  }
diff --git a/lib/ctrlctx/auth.go b/lib/ctrlctx/auth.go

new file mode 100644 (file)

index 0000000..f4c472f
--- /dev/null
+++ b/lib/ctrlctx/auth.go
@@ -0,0 +1,190 @@
+// Copyright (C) The Arvados Authors. All rights reserved.
+//
+// SPDX-License-Identifier: AGPL-3.0
+
+package ctrlctx
+
+import (
+       "context"
+       "crypto/hmac"
+       "crypto/sha256"
+       "database/sql"
+       "errors"
+       "fmt"
+       "io"
+       "strings"
+       "sync"
+       "time"
+
+       "git.arvados.org/arvados.git/lib/controller/api"
+       "git.arvados.org/arvados.git/sdk/go/arvados"
+       "git.arvados.org/arvados.git/sdk/go/auth"
+       "github.com/ghodss/yaml"
+)
+
+var (
+       ErrNoAuthContext   = errors.New("bug: there is no authorization in this context")
+       ErrUnauthenticated = errors.New("unauthenticated request")
+)
+
+// WrapCallsWithAuth builds a call wrapper (suitable for assigning to
+// router.router.WrapCalls) that attaches an authcontext to the
+// context of each wrapped call, so CurrentAuth(ctx) works from
+// inside the wrapped functions. Every function wrapped by the same
+// returned wrapper shares a single authcache.
+//
+// The incoming context must come from WrapCallsInTransactions or
+// NewWithTransaction.
+func WrapCallsWithAuth(cluster *arvados.Cluster) func(api.RoutableFunc) api.RoutableFunc {
+       cache := &authcache{}
+       return func(origFunc api.RoutableFunc) api.RoutableFunc {
+               return func(ctx context.Context, opts interface{}) (interface{}, error) {
+                       actx := &authcontext{
+                               authcache: cache,
+                               cluster:   cluster,
+                       }
+                       // With no credentials in ctx, tokens stays
+                       // nil.
+                       if creds, ok := auth.FromContext(ctx); ok {
+                               actx.tokens = creds.Tokens
+                       }
+                       return origFunc(context.WithValue(ctx, contextKeyAuth, actx), opts)
+               }
+       }
+}
+
+// CurrentAuth reports who is making the current request: the
+// arvados.User whose privileges should be used in the given context,
+// and the arvados.APIClientAuthorization the caller presented in
+// order to authenticate.
+//
+// Returns ErrNoAuthContext if ctx carries no auth context, and
+// ErrUnauthenticated if the current request was not authenticated
+// (no token provided, token is expired, etc).
+func CurrentAuth(ctx context.Context) (*arvados.User, *arvados.APIClientAuthorization, error) {
+       actx, ok := ctx.Value(contextKeyAuth).(*authcontext)
+       if !ok {
+               return nil, nil, ErrNoAuthContext
+       }
+       // The tokens are validated/looked up only once per API call,
+       // even though authcache should be efficient enough to do a
+       // lookup each time. That way repeated calls made while
+       // handling a single API call always get the same answer.
+       actx.lookupOnce.Do(func() {
+               for _, token := range actx.tokens {
+                       user, aca, err := actx.authcache.lookup(ctx, actx.cluster, token)
+                       switch {
+                       case err != nil:
+                               // Unexpected failure: give up
+                               // without trying further tokens.
+                               actx.err = err
+                               return
+                       case user != nil:
+                               // First valid token wins.
+                               actx.user, actx.apiClientAuthorization = user, aca
+                               return
+                       }
+               }
+               actx.err = ErrUnauthenticated
+       })
+       return actx.user, actx.apiClientAuthorization, actx.err
+}
+
+// contextKeyA is the type of the context key under which the
+// authcontext is stored. Using a dedicated key type keeps the key
+// from colliding with context keys defined elsewhere.
+type contextKeyA string
+
+var contextKeyAuth = contextKeyA("auth")
+
+// authcontext is the per-call auth state that WrapCallsWithAuth
+// stores in the context and CurrentAuth reads back.
+type authcontext struct {
+       authcache              *authcache
+       cluster                *arvados.Cluster
+       tokens                 []string
+       // user, apiClientAuthorization, and err hold the outcome of
+       // the token lookup. CurrentAuth fills them in inside
+       // lookupOnce.Do, so the lookup runs at most once.
+       user                   *arvados.User
+       apiClientAuthorization *arvados.APIClientAuthorization
+       err                    error
+       lookupOnce             sync.Once
+}
+
+// authcacheTTL is how long a cached lookup result stays usable, and
+// also the interval between purges of expired cache entries.
+var authcacheTTL = time.Minute
+
+// authcacheent is one cached lookup result.
+type authcacheent struct {
+       expireTime             time.Time
+       apiClientAuthorization arvados.APIClientAuthorization
+       user                   arvados.User
+}
+
+// authcache caches lookup results, keyed by the token string as
+// presented. mtx guards entries and nextCleanup.
+type authcache struct {
+       mtx         sync.Mutex
+       entries     map[string]*authcacheent
+       nextCleanup time.Time
+}
+
+// lookup returns the user and aca info for a given token. Returns nil
+// if the token is not valid. Returns a non-nil error if there was an
+// unexpected error from the database, etc.
+//
+// Successful lookups are cached for authcacheTTL, keyed by the token
+// string as presented. Invalid tokens and errors are not cached. The
+// database query runs in the transaction returned by CurrentTx(ctx).
+func (ac *authcache) lookup(ctx context.Context, cluster *arvados.Cluster, token string) (*arvados.User, *arvados.APIClientAuthorization, error) {
+       // Fast path: use the cached entry if it has not expired yet.
+       ac.mtx.Lock()
+       ent := ac.entries[token]
+       ac.mtx.Unlock()
+       if ent != nil && ent.expireTime.After(time.Now()) {
+               return &ent.user, &ent.apiClientAuthorization, nil
+       }
+       if token == "" {
+               return nil, nil, nil
+       }
+       tx, err := CurrentTx(ctx)
+       if err != nil {
+               return nil, nil, err
+       }
+       var aca arvados.APIClientAuthorization
+       var user arvados.User
+
+       var cond string
+       var args []interface{}
+       // A v2 token has the form "v2/{uuid}/{secret}", with the '/'
+       // that follows the uuid at index 30. Anything after a further
+       // '/' is ignored: only fields[1] and fields[2] are matched.
+       if len(token) > 30 && strings.HasPrefix(token, "v2/") && token[30] == '/' {
+               fields := strings.Split(token, "/")
+               cond = `aca.uuid = $1 and aca.api_token = $2`
+               args = []interface{}{fields[1], fields[2]}
+       } else {
+               // Bare token or OIDC access token: match a row whose
+               // api_token is either the token itself or the hex
+               // HMAC-SHA256 of the token keyed with SystemRootToken.
+               mac := hmac.New(sha256.New, []byte(cluster.SystemRootToken))
+               io.WriteString(mac, token)
+               hmac := fmt.Sprintf("%x", mac.Sum(nil))
+               cond = `aca.api_token in ($1, $2)`
+               args = []interface{}{token, hmac}
+       }
+       var expiresAt sql.NullTime
+       var scopesYAML []byte
+       // cond is one of the two constant strings chosen above; the
+       // token-derived values are passed only as query parameters.
+       err = tx.QueryRowContext(ctx, `
+select aca.uuid, aca.expires_at, aca.api_token, aca.scopes, users.uuid, users.is_active, users.is_admin
+ from api_client_authorizations aca
+ left join users on aca.user_id = users.id
+ where `+cond+`
+ and (expires_at is null or expires_at > current_timestamp at time zone 'UTC')`, args...).Scan(
+               &aca.UUID, &expiresAt, &aca.APIToken, &scopesYAML,
+               &user.UUID, &user.IsActive, &user.IsAdmin)
+       if err == sql.ErrNoRows {
+               // No matching unexpired row: the token is not valid.
+               return nil, nil, nil
+       } else if err != nil {
+               return nil, nil, err
+       }
+       aca.ExpiresAt = expiresAt.Time
+       if len(scopesYAML) > 0 {
+               err = yaml.Unmarshal(scopesYAML, &aca.Scopes)
+               if err != nil {
+                       return nil, nil, fmt.Errorf("loading scopes for %s: %w", aca.UUID, err)
+               }
+       }
+       ent = &authcacheent{
+               expireTime:             time.Now().Add(authcacheTTL),
+               apiClientAuthorization: aca,
+               user:                   user,
+       }
+       ac.mtx.Lock()
+       defer ac.mtx.Unlock()
+       if ac.entries == nil {
+               ac.entries = map[string]*authcacheent{}
+       }
+       // Purge expired entries once nextCleanup has passed (or on
+       // first use), then schedule the next purge one authcacheTTL
+       // from now.
+       if ac.nextCleanup.IsZero() || ac.nextCleanup.Before(time.Now()) {
+               for token, ent := range ac.entries {
+                       if !ent.expireTime.After(time.Now()) {
+                               delete(ac.entries, token)
+                       }
+               }
+               ac.nextCleanup = time.Now().Add(authcacheTTL)
+       }
+       ac.entries[token] = ent
+       return &ent.user, &ent.apiClientAuthorization, nil
+}
diff --git a/lib/ctrlctx/auth_test.go b/lib/ctrlctx/auth_test.go

new file mode 100644 (file)

index 0000000..e6803e5
--- /dev/null
+++ b/lib/ctrlctx/auth_test.go
@@ -0,0 +1,83 @@
+// Copyright (C) The Arvados Authors. All rights reserved.
+//
+// SPDX-License-Identifier: AGPL-3.0
+
+package ctrlctx
+
+import (
+       "context"
+
+       "git.arvados.org/arvados.git/lib/config"
+       "git.arvados.org/arvados.git/sdk/go/arvadostest"
+       "git.arvados.org/arvados.git/sdk/go/auth"
+       "git.arvados.org/arvados.git/sdk/go/ctxlog"
+       "github.com/jmoiron/sqlx"
+       _ "github.com/lib/pq"
+       check "gopkg.in/check.v1"
+)
+
+// TestAuthContext runs CurrentAuth inside calls wrapped by both
+// WrapCallsInTransactions and WrapCallsWithAuth, and checks the
+// result for valid tokens, invalid tokens, and a context that
+// carries no credentials.
+func (*DatabaseSuite) TestAuthContext(c *check.C) {
+       cfg, err := config.NewLoader(nil, ctxlog.TestLogger(c)).Load()
+       c.Assert(err, check.IsNil)
+       cluster, err := cfg.GetCluster("")
+       c.Assert(err, check.IsNil)
+
+       getter := func(context.Context) (*sqlx.DB, error) {
+               return sqlx.Open("postgres", cluster.PostgreSQL.Connection.String())
+       }
+       authwrapper := WrapCallsWithAuth(cluster)
+       dbwrapper := WrapCallsInTransactions(getter)
+
+       // valid tokens
+       for _, token := range []string{
+               arvadostest.ActiveToken,
+               arvadostest.ActiveTokenV2,
+               arvadostest.ActiveTokenV2 + "/asdfasdfasdf",
+               arvadostest.ActiveTokenV2, // cached
+       } {
+               ok, err := dbwrapper(authwrapper(func(ctx context.Context, opts interface{}) (interface{}, error) {
+                       user, aca, err := CurrentAuth(ctx)
+                       if c.Check(err, check.IsNil) {
+                               c.Check(user.UUID, check.Equals, "zzzzz-tpzed-xurymjxw79nv3jz")
+                               c.Check(aca.UUID, check.Equals, "zzzzz-gj3su-077z32aux8dg2s1")
+                               c.Check(aca.Scopes, check.DeepEquals, []string{"all"})
+                       }
+                       return true, nil
+               }))(auth.NewContext(context.Background(), auth.NewCredentials(token)), "blah")
+               c.Check(ok, check.Equals, true)
+               c.Check(err, check.IsNil)
+       }
+
+       // bad tokens
+       for _, token := range []string{
+               arvadostest.ActiveToken + "X",
+               arvadostest.ActiveTokenV2 + "X",
+               arvadostest.ActiveTokenV2[:30], // "v2/{uuid}"
+               arvadostest.ActiveTokenV2[:31], // "v2/{uuid}/"
+               "bogus",
+               "",
+       } {
+               ok, err := dbwrapper(authwrapper(func(ctx context.Context, opts interface{}) (interface{}, error) {
+                       user, aca, err := CurrentAuth(ctx)
+                       c.Check(err, check.Equals, ErrUnauthenticated)
+                       c.Check(user, check.IsNil)
+                       c.Check(aca, check.IsNil)
+                       return true, err
+               }))(auth.NewContext(context.Background(), auth.NewCredentials(token)), "blah")
+               c.Check(ok, check.Equals, true)
+               c.Check(err, check.Equals, ErrUnauthenticated)
+       }
+
+       // no credentials in the context: authwrapper still installs
+       // an auth context, but with no tokens, so the expected result
+       // is ErrUnauthenticated rather than ErrNoAuthContext
+       {
+               ok, err := dbwrapper(authwrapper(func(ctx context.Context, opts interface{}) (interface{}, error) {
+                       user, aca, err := CurrentAuth(ctx)
+                       c.Check(err, check.Equals, ErrUnauthenticated)
+                       c.Check(user, check.IsNil)
+                       c.Check(aca, check.IsNil)
+                       return true, err
+               }))(context.Background(), "blah")
+               c.Check(ok, check.Equals, true)
+               c.Check(err, check.Equals, ErrUnauthenticated)
+       }
+}
diff --git a/lib/ctrlctx/db.go b/lib/ctrlctx/db.go

index 36d79d3d2ef89ac9819d12e3f4e2f175c96426bd..2a05096ce18b7430e7e1e487dd5d710024ac9193 100644 (file)
--- a/lib/ctrlctx/db.go
+++ b/lib/ctrlctx/db.go
@@ -10,8 +10,10 @@ import (
         "sync"
  
         "git.arvados.org/arvados.git/lib/controller/api"
+       "git.arvados.org/arvados.git/sdk/go/arvados"
         "git.arvados.org/arvados.git/sdk/go/ctxlog"
         "github.com/jmoiron/sqlx"
+
         // sqlx needs lib/pq to talk to PostgreSQL
         _ "github.com/lib/pq"
  )
@@ -107,6 +109,26 @@ func New(ctx context.Context, getdb func(context.Context) (*sqlx.DB, error)) (co
         }
  }
  
+// NewTx begins a fresh transaction on the database obtained from the
+// transaction context in ctx. Committing or rolling it back is the
+// caller's job. Use it for database work that is separate from the
+// API transaction (see CurrentTx), e.g., queries that will be
+// committed even if the API call fails, or held open after the API
+// call finishes.
+//
+// Returns ErrNoTransaction if ctx carries no transaction context.
+func NewTx(ctx context.Context) (*sqlx.Tx, error) {
+       current, found := ctx.Value(contextKeyTransaction).(*transaction)
+       if !found {
+               return nil, ErrNoTransaction
+       }
+       pgdb, err := current.getdb(ctx)
+       if err != nil {
+               return nil, err
+       }
+       return pgdb.Beginx()
+}
+
+// CurrentTx returns a transaction that will be committed after the
+// current API call completes, or rolled back if the current API call
+// returns an error.
  func CurrentTx(ctx context.Context) (*sqlx.Tx, error) {
         txn, ok := ctx.Value(contextKeyTransaction).(*transaction)
         if !ok {
@@ -121,3 +143,33 @@ func CurrentTx(ctx context.Context) (*sqlx.Tx, error) {
         })
         return txn.tx, txn.err
  }
+
+// errDBConnection is the error GetDB returns for any failure to open
+// or ping the database; the underlying error is only logged.
+var errDBConnection = errors.New("database connection error")
+
+// DBConnector opens a PostgreSQL database handle on first use and
+// hands the same *sqlx.DB to every later caller. mtx guards pgdb.
+type DBConnector struct {
+       PostgreSQL arvados.PostgreSQL
+       pgdb       *sqlx.DB
+       mtx        sync.Mutex
+}
+
+// GetDB returns the shared database handle, opening and pinging it
+// if no handle has been stored yet. If PostgreSQL.ConnectionPool is
+// positive, it is applied as the handle's maximum number of open
+// connections.
+//
+// On failure the underlying error is logged via the logger in ctx
+// and errDBConnection is returned. Nothing is stored in that case,
+// so the next call tries again.
+func (dbc *DBConnector) GetDB(ctx context.Context) (*sqlx.DB, error) {
+       dbc.mtx.Lock()
+       defer dbc.mtx.Unlock()
+       if dbc.pgdb != nil {
+               return dbc.pgdb, nil
+       }
+       db, err := sqlx.Open("postgres", dbc.PostgreSQL.Connection.String())
+       if err != nil {
+               ctxlog.FromContext(ctx).WithError(err).Error("postgresql connect failed")
+               return nil, errDBConnection
+       }
+       if p := dbc.PostgreSQL.ConnectionPool; p > 0 {
+               db.SetMaxOpenConns(p)
+       }
+       if err := db.Ping(); err != nil {
+               ctxlog.FromContext(ctx).WithError(err).Error("postgresql connect succeeded but ping failed")
+               // Release the handle we are about to discard, so
+               // repeated failed attempts do not accumulate open
+               // handles.
+               db.Close()
+               return nil, errDBConnection
+       }
+       dbc.pgdb = db
+       return db, nil
+}
diff --git a/lib/diagnostics/cmd.go b/lib/diagnostics/cmd.go

index 799abf9da4e278bc7f2f4150e7f284c991c677c4..ed963e1ef75b42439ed1e23fef7d11e9a62a695c 100644 (file)
--- a/lib/diagnostics/cmd.go
+++ b/lib/diagnostics/cmd.go
@@ -16,12 +16,15 @@ import (
         "net"
         "net/http"
         "net/url"
+       "os"
         "strings"
         "time"
  
         "git.arvados.org/arvados.git/lib/cmd"
+       "git.arvados.org/arvados.git/lib/config"
         "git.arvados.org/arvados.git/sdk/go/arvados"
         "git.arvados.org/arvados.git/sdk/go/ctxlog"
+       "git.arvados.org/arvados.git/sdk/go/health"
         "github.com/sirupsen/logrus"
  )
  
@@ -35,6 +38,7 @@ func (Command) RunCommand(prog string, args []string, stdin io.Reader, stdout, s
         f.StringVar(&diag.dockerImage, "docker-image", "", "image to use when running a test container (default: use embedded hello-world image)")
         f.BoolVar(&diag.checkInternal, "internal-client", false, "check that this host is considered an \"internal\" client")
         f.BoolVar(&diag.checkExternal, "external-client", false, "check that this host is considered an \"external\" client")
+       f.BoolVar(&diag.verbose, "v", false, "verbose: include more information in report")
         f.IntVar(&diag.priority, "priority", 500, "priority for test container (1..1000, or 0 to skip)")
         f.DurationVar(&diag.timeout, "timeout", 10*time.Second, "timeout for http requests")
         if ok, code := cmd.ParseFlags(f, prog, args, "", stderr); !ok {
@@ -58,6 +62,7 @@ func (Command) RunCommand(prog string, args []string, stdin io.Reader, stdout, s
  }
  
  // docker save hello-world > hello-world.tar
+//
  //go:embed hello-world.tar
  var HelloWorldDockerImage []byte
  
@@ -70,6 +75,7 @@ type diagnoser struct {
         dockerImage   string
         checkInternal bool
         checkExternal bool
+       verbose       bool
         timeout       time.Duration
         logger        *logrus.Logger
         errors        []string
@@ -84,6 +90,12 @@ func (diag *diagnoser) infof(f string, args ...interface{}) {
         diag.logger.Infof("  ... "+f, args...)
  }
  
+// verbosef logs a formatted message at info level, with the
+// "  ... " prefix, but only when the verbose flag is set.
+func (diag *diagnoser) verbosef(f string, args ...interface{}) {
+       if !diag.verbose {
+               return
+       }
+       diag.logger.Infof("  ... "+f, args...)
+}
+
  func (diag *diagnoser) warnf(f string, args ...interface{}) {
         diag.logger.Warnf("  ... "+f, args...)
  }
@@ -125,6 +137,62 @@ func (diag *diagnoser) runtests() {
                 return
         }
  
+       hostname, err := os.Hostname()
+       if err != nil {
+               // Not being able to determine the hostname is only
+               // worth a warning. Pass err so the %s verb has an
+               // operand and the cause is actually printed.
+               diag.warnf("error getting hostname: %s", err)
+       } else {
+               diag.verbosef("hostname = %s", hostname)
+       }
+
+       diag.dotest(5, "running health check (same as `arvados-server check`)", func() error {
+               ldr := config.NewLoader(&bytes.Buffer{}, ctxlog.New(&bytes.Buffer{}, "text", "info"))
+               ldr.SetupFlags(flag.NewFlagSet("diagnostics", flag.ContinueOnError))
+               cfg, err := ldr.Load()
+               if err != nil {
+                       diag.infof("skipping because config could not be loaded: %s", err)
+                       return nil
+               }
+               cluster, err := cfg.GetCluster("")
+               if err != nil {
+                       return err
+               }
+               if cluster.SystemRootToken != os.Getenv("ARVADOS_API_TOKEN") {
+                       return fmt.Errorf("diagnostics usage error: %s is readable but SystemRootToken does not match $ARVADOS_API_TOKEN (to fix, either run 'arvados-client sudo diagnostics' to load everything from config file, or set ARVADOS_CONFIG=- to load nothing from config file)", ldr.Path)
+               }
+               agg := &health.Aggregator{Cluster: cluster}
+               resp := agg.ClusterHealth()
+               for _, e := range resp.Errors {
+                       diag.errorf("health check: %s", e)
+               }
+               if len(resp.Errors) > 0 {
+                       diag.infof("consider running `arvados-server check -yaml` for a comprehensive report")
+               }
+               diag.verbosef("reported clock skew = %v", resp.ClockSkew)
+               reported := map[string]bool{}
+               for _, result := range resp.Checks {
+                       version := strings.SplitN(result.Metrics.Version, " (go", 2)[0]
+                       if version != "" && !reported[version] {
+                               diag.verbosef("arvados version = %s", version)
+                               reported[version] = true
+                       }
+               }
+               reported = map[string]bool{}
+               for _, result := range resp.Checks {
+                       if result.Server != "" && !reported[result.Server] {
+                               diag.verbosef("http frontend version = %s", result.Server)
+                               reported[result.Server] = true
+                       }
+               }
+               reported = map[string]bool{}
+               for _, result := range resp.Checks {
+                       if sha := result.ConfigSourceSHA256; sha != "" && !reported[sha] {
+                               diag.verbosef("config file sha256 = %s", sha)
+                               reported[sha] = true
+                       }
+               }
+               return nil
+       })
+
         var dd arvados.DiscoveryDocument
         ddpath := "discovery/v1/apis/arvados/v1/rest"
         diag.dotest(10, fmt.Sprintf("getting discovery document from https://%s/%s", client.APIHost, ddpath), func() error {
@@ -134,7 +202,7 @@ func (diag *diagnoser) runtests() {
                 if err != nil {
                         return err
                 }
-               diag.debugf("BlobSignatureTTL = %d", dd.BlobSignatureTTL)
+               diag.verbosef("BlobSignatureTTL = %d", dd.BlobSignatureTTL)
                 return nil
         })
  
@@ -148,7 +216,7 @@ func (diag *diagnoser) runtests() {
                 if err != nil {
                         return err
                 }
-               diag.debugf("Collections.BlobSigning = %v", cluster.Collections.BlobSigning)
+               diag.verbosef("Collections.BlobSigning = %v", cluster.Collections.BlobSigning)
                 cfgOK = true
                 return nil
         })
@@ -161,7 +229,7 @@ func (diag *diagnoser) runtests() {
                 if err != nil {
                         return err
                 }
-               diag.debugf("user uuid = %s", user.UUID)
+               diag.verbosef("user uuid = %s", user.UUID)
                 return nil
         })
  
@@ -250,9 +318,9 @@ func (diag *diagnoser) runtests() {
                 isInternal := found["proxy"] == 0 && len(keeplist.Items) > 0
                 isExternal := found["proxy"] > 0 && found["proxy"] == len(keeplist.Items)
                 if isExternal {
-                       diag.debugf("controller returned only proxy services, this host is treated as \"external\"")
+                       diag.infof("controller returned only proxy services, this host is treated as \"external\"")
                 } else if isInternal {
-                       diag.debugf("controller returned only non-proxy services, this host is treated as \"internal\"")
+                       diag.infof("controller returned only non-proxy services, this host is treated as \"internal\"")
                 }
                 if (diag.checkInternal && !isInternal) || (diag.checkExternal && !isExternal) {
                         return fmt.Errorf("expecting internal=%v external=%v, but found internal=%v external=%v", diag.checkInternal, diag.checkExternal, isInternal, isExternal)
@@ -329,7 +397,7 @@ func (diag *diagnoser) runtests() {
                 }
                 if len(grplist.Items) > 0 {
                         project = grplist.Items[0]
-                       diag.debugf("using existing project, uuid = %s", project.UUID)
+                       diag.verbosef("using existing project, uuid = %s", project.UUID)
                         return nil
                 }
                 diag.debugf("list groups: ok, no results")
@@ -340,7 +408,7 @@ func (diag *diagnoser) runtests() {
                 if err != nil {
                         return fmt.Errorf("create project: %s", err)
                 }
-               diag.debugf("created project, uuid = %s", project.UUID)
+               diag.verbosef("created project, uuid = %s", project.UUID)
                 return nil
         })
  
@@ -360,7 +428,7 @@ func (diag *diagnoser) runtests() {
                 if err != nil {
                         return err
                 }
-               diag.debugf("ok, uuid = %s", collection.UUID)
+               diag.verbosef("ok, uuid = %s", collection.UUID)
                 return nil
         })
  
@@ -630,17 +698,16 @@ func (diag *diagnoser) runtests() {
                 if err != nil {
                         return err
                 }
-               diag.debugf("container request uuid = %s", cr.UUID)
-               diag.debugf("container uuid = %s", cr.ContainerUUID)
+               diag.verbosef("container request uuid = %s", cr.UUID)
+               diag.verbosef("container uuid = %s", cr.ContainerUUID)
  
                 timeout := 10 * time.Minute
                 diag.infof("container request submitted, waiting up to %v for container to run", arvados.Duration(timeout))
-               ctx, cancel = context.WithDeadline(context.Background(), time.Now().Add(timeout))
-               defer cancel()
+               deadline := time.Now().Add(timeout)
  
                 var c arvados.Container
-               for ; cr.State != arvados.ContainerRequestStateFinal; time.Sleep(2 * time.Second) {
-                       ctx, cancel := context.WithDeadline(ctx, time.Now().Add(diag.timeout))
+               for ; cr.State != arvados.ContainerRequestStateFinal && time.Now().Before(deadline); time.Sleep(2 * time.Second) {
+                       ctx, cancel := context.WithDeadline(context.Background(), time.Now().Add(diag.timeout))
                         defer cancel()
  
                         crStateWas := cr.State
@@ -660,11 +727,26 @@ func (diag *diagnoser) runtests() {
                         if c.State != cStateWas {
                                 diag.debugf("container state = %s", c.State)
                         }
+
+                       cancel()
                 }
  
+               if cr.State != arvados.ContainerRequestStateFinal {
+                       err := client.RequestAndDecodeContext(context.Background(), &cr, "PATCH", "arvados/v1/container_requests/"+cr.UUID, nil, map[string]interface{}{
+                               "container_request": map[string]interface{}{
+                                       "priority": 0,
+                               }})
+                       if err != nil {
+                               diag.infof("error canceling container request %s: %s", cr.UUID, err)
+                       } else {
+                               diag.debugf("canceled container request %s", cr.UUID)
+                       }
+                       return fmt.Errorf("timed out waiting for container to finish; container request %s state was %q, container %s state was %q", cr.UUID, cr.State, c.UUID, c.State)
+               }
                 if c.State != arvados.ContainerStateComplete {
                         return fmt.Errorf("container request %s is final but container %s did not complete: container state = %q", cr.UUID, cr.ContainerUUID, c.State)
-               } else if c.ExitCode != 0 {
+               }
+               if c.ExitCode != 0 {
                         return fmt.Errorf("container exited %d", c.ExitCode)
                 }
                 return nil
diff --git a/lib/dispatchcloud/dispatcher.go b/lib/dispatchcloud/dispatcher.go

index ae91a710e395295f47a34cb5645f980021e79021..3403c50c972987e7f6f21a927a6db592fac9f6fc 100644 (file)
--- a/lib/dispatchcloud/dispatcher.go
+++ b/lib/dispatchcloud/dispatcher.go
@@ -15,6 +15,8 @@ import (
         "time"
  
         "git.arvados.org/arvados.git/lib/cloud"
+       "git.arvados.org/arvados.git/lib/controller/dblock"
+       "git.arvados.org/arvados.git/lib/ctrlctx"
         "git.arvados.org/arvados.git/lib/dispatchcloud/container"
         "git.arvados.org/arvados.git/lib/dispatchcloud/scheduler"
         "git.arvados.org/arvados.git/lib/dispatchcloud/sshexecutor"
@@ -53,6 +55,7 @@ type dispatcher struct {
         Registry      *prometheus.Registry
         InstanceSetID cloud.InstanceSetID
  
+       dbConnector ctrlctx.DBConnector
         logger      logrus.FieldLogger
         instanceSet cloud.InstanceSet
         pool        pool
@@ -118,6 +121,7 @@ func (disp *dispatcher) setup() {
  
  func (disp *dispatcher) initialize() {
         disp.logger = ctxlog.FromContext(disp.Context)
+       disp.dbConnector = ctrlctx.DBConnector{PostgreSQL: disp.Cluster.PostgreSQL}
  
         disp.ArvClient.AuthToken = disp.AuthToken
  
@@ -143,6 +147,7 @@ func (disp *dispatcher) initialize() {
         if err != nil {
                 disp.logger.Fatalf("error initializing driver: %s", err)
         }
+       dblock.Dispatch.Lock(disp.Context, disp.dbConnector.GetDB)
         disp.instanceSet = instanceSet
         disp.pool = worker.NewPool(disp.logger, disp.ArvClient, disp.Registry, disp.InstanceSetID, disp.instanceSet, disp.newExecutor, disp.sshKey.PublicKey(), disp.Cluster)
         disp.queue = container.NewQueue(disp.logger, disp.Registry, disp.typeChooser, disp.ArvClient)
@@ -175,6 +180,7 @@ func (disp *dispatcher) initialize() {
  }
  
  func (disp *dispatcher) run() {
+       defer dblock.Dispatch.Unlock()
         defer close(disp.stopped)
         defer disp.instanceSet.Stop()
         defer disp.pool.Stop()
diff --git a/lib/dispatchcloud/dispatcher_test.go b/lib/dispatchcloud/dispatcher_test.go

index 829a053636d5dc07abaac1c649810c5416e09fb6..2d486da5fd5a9d4aafbbc0b82f06d0c20c7f91e8 100644 (file)
--- a/lib/dispatchcloud/dispatcher_test.go
+++ b/lib/dispatchcloud/dispatcher_test.go
@@ -15,6 +15,7 @@ import (
         "sync"
         "time"
  
+       "git.arvados.org/arvados.git/lib/config"
         "git.arvados.org/arvados.git/lib/dispatchcloud/test"
         "git.arvados.org/arvados.git/sdk/go/arvados"
         "git.arvados.org/arvados.git/sdk/go/arvadostest"
@@ -49,8 +50,16 @@ func (s *DispatcherSuite) SetUpTest(c *check.C) {
                 MinTimeBetweenCreateCalls: time.Millisecond,
         }
  
+       // We need the postgresql connection info from the integration
+       // test config.
+       cfg, err := config.NewLoader(nil, ctxlog.FromContext(s.ctx)).Load()
+       c.Assert(err, check.IsNil)
+       testcluster, err := cfg.GetCluster("")
+       c.Assert(err, check.IsNil)
+
         s.cluster = &arvados.Cluster{
                 ManagementToken: "test-management-token",
+               PostgreSQL:      testcluster.PostgreSQL,
                 Containers: arvados.ContainersConfig{
                         CrunchRunCommand:       "crunch-run",
                         CrunchRunArgumentsList: []string{"--foo", "--extra='args'"},
@@ -184,12 +193,18 @@ func (s *DispatcherSuite) TestDispatchToStubDriver(c *check.C) {
         err := s.disp.CheckHealth()
         c.Check(err, check.IsNil)
  
-       select {
-       case <-done:
-               c.Logf("containers finished (%s), waiting for instances to shutdown and queue to clear", time.Since(start))
-       case <-time.After(10 * time.Second):
-               c.Fatalf("timed out; still waiting for %d containers: %q", len(waiting), waiting)
+       for len(waiting) > 0 {
+               waswaiting := len(waiting)
+               select {
+               case <-done:
+                       // loop will end because len(waiting)==0
+               case <-time.After(3 * time.Second):
+                       if len(waiting) >= waswaiting {
+                               c.Fatalf("timed out; no progress in 3s while waiting for %d containers: %q", len(waiting), waiting)
+                       }
+               }
         }
+       c.Logf("containers finished (%s), waiting for instances to shutdown and queue to clear", time.Since(start))
  
         deadline := time.Now().Add(5 * time.Second)
         for range time.NewTicker(10 * time.Millisecond).C {
diff --git a/lib/dispatchcloud/node_size.go b/lib/dispatchcloud/node_size.go

index 7c7643bfc7622fc8c876eba9c2e01d9203385074..0b394f4cfe4f76849fc2eb42541ed613e325921f 100644 (file)
--- a/lib/dispatchcloud/node_size.go
+++ b/lib/dispatchcloud/node_size.go
@@ -56,7 +56,7 @@ func estimateDockerImageSize(collectionPDH string) int64 {
  // EstimateScratchSpace estimates how much available disk space (in
  // bytes) is needed to run the container by summing the capacity
  // requested by 'tmp' mounts plus disk space required to load the
-// Docker image.
+// Docker image plus the arv-mount disk cache.
  func EstimateScratchSpace(ctr *arvados.Container) (needScratch int64) {
         for _, m := range ctr.Mounts {
                 if m.Kind == "tmp" {
@@ -80,6 +80,9 @@ func EstimateScratchSpace(ctr *arvados.Container) (needScratch int64) {
         // Now reserve space for the extracted image on disk.
         needScratch += dockerImageSize
  
+       // Now reserve space for the arv-mount disk cache
+       needScratch += ctr.RuntimeConstraints.KeepCacheDisk
+
         return
  }
  
@@ -110,7 +113,12 @@ func ChooseInstanceType(cc *arvados.Cluster, ctr *arvados.Container) (best arvad
  
         needRAM := ctr.RuntimeConstraints.RAM + ctr.RuntimeConstraints.KeepCacheRAM
         needRAM += int64(cc.Containers.ReserveExtraRAM)
-       needRAM += int64(cc.Containers.LocalKeepBlobBuffersPerVCPU * needVCPUs * (1 << 26))
+       if cc.Containers.LocalKeepBlobBuffersPerVCPU > 0 {
+               // + 200 MiB for keepstore process + 10% for GOGC=10
+               needRAM += 220 << 20
+               // + 64 MiB for each blob buffer + 10% for GOGC=10
+               needRAM += int64(cc.Containers.LocalKeepBlobBuffersPerVCPU * needVCPUs * (1 << 26) * 11 / 10)
+       }
         needRAM = (needRAM * 100) / int64(100-discountConfiguredRAMPercent)
  
         ok := false
diff --git a/lib/dispatchcloud/node_size_test.go b/lib/dispatchcloud/node_size_test.go

index eb3648e8ac13265995bf98b040c47106ea380ea3..86bfbec7b629dc731e309740346dec85a24ae2d7 100644 (file)
--- a/lib/dispatchcloud/node_size_test.go
+++ b/lib/dispatchcloud/node_size_test.go
@@ -80,7 +80,10 @@ func (*NodeSizeSuite) TestChoose(c *check.C) {
                         "costly": {Price: 4.4, RAM: 4000000000, VCPUs: 8, Scratch: 2 * GiB, Name: "costly"},
                 },
         } {
-               best, err := ChooseInstanceType(&arvados.Cluster{InstanceTypes: menu, Containers: arvados.ContainersConfig{ReserveExtraRAM: 268435456}}, &arvados.Container{
+               best, err := ChooseInstanceType(&arvados.Cluster{InstanceTypes: menu, Containers: arvados.ContainersConfig{
+                       LocalKeepBlobBuffersPerVCPU: 1,
+                       ReserveExtraRAM:             268435456,
+               }}, &arvados.Container{
                         Mounts: map[string]arvados.Mount{
                                 "/tmp": {Kind: "tmp", Capacity: 2 * int64(GiB)},
                         },
@@ -98,7 +101,30 @@ func (*NodeSizeSuite) TestChoose(c *check.C) {
         }
  }
  
-func (*NodeSizeSuite) TestChoosePreemptable(c *check.C) {
+func (*NodeSizeSuite) TestChooseWithBlobBuffersOverhead(c *check.C) {
+       menu := map[string]arvados.InstanceType{
+               "nearly": {Price: 2.2, RAM: 4000000000, VCPUs: 4, Scratch: 2 * GiB, Name: "small"},
+               "best":   {Price: 3.3, RAM: 8000000000, VCPUs: 4, Scratch: 2 * GiB, Name: "best"},
+               "costly": {Price: 4.4, RAM: 12000000000, VCPUs: 8, Scratch: 2 * GiB, Name: "costly"},
+       }
+       best, err := ChooseInstanceType(&arvados.Cluster{InstanceTypes: menu, Containers: arvados.ContainersConfig{
+               LocalKeepBlobBuffersPerVCPU: 16, // 16 x 64 MiB = 1 GiB per vcpu; 2 vcpus => 2 GiB
+               ReserveExtraRAM:             268435456,
+       }}, &arvados.Container{
+               Mounts: map[string]arvados.Mount{
+                       "/tmp": {Kind: "tmp", Capacity: 2 * int64(GiB)},
+               },
+               RuntimeConstraints: arvados.RuntimeConstraints{
+                       VCPUs:        2,
+                       RAM:          987654321,
+                       KeepCacheRAM: 123456789,
+               },
+       })
+       c.Check(err, check.IsNil)
+       c.Check(best.Name, check.Equals, "best")
+}
+
+func (*NodeSizeSuite) TestChoosePreemptible(c *check.C) {
         menu := map[string]arvados.InstanceType{
                 "costly":      {Price: 4.4, RAM: 4000000000, VCPUs: 8, Scratch: 2 * GiB, Preemptible: true, Name: "costly"},
                 "almost best": {Price: 2.2, RAM: 2000000000, VCPUs: 4, Scratch: 2 * GiB, Name: "almost best"},
diff --git a/lib/install/deps.go b/lib/install/deps.go

index e02c3743e71809a40053983d1e753e238577f2ec..1b4bf7266d29124dd56a92c9d9284828896cd706 100644 (file)
--- a/lib/install/deps.go
+++ b/lib/install/deps.go
@@ -30,18 +30,18 @@ import (
  
  var Command cmd.Handler = &installCommand{}
  
-const goversion = "1.17.7"
+const goversion = "1.18.8"
  
  const (
-       rubyversion             = "2.7.5"
+       rubyversion             = "2.7.6"
         bundlerversion          = "2.2.19"
         singularityversion      = "3.9.9"
         pjsversion              = "1.9.8"
         geckoversion            = "0.24.0"
         gradleversion           = "5.3.1"
-       nodejsversion           = "v12.22.11"
+       nodejsversion           = "v12.22.12"
         devtestDatabasePassword = "insecure_arvados_test"
-       workbench2version       = "2454ac35292a79594c32a80430740317ed5005cf"
+       workbench2version       = "e30e54d674c95ee15e296c71e471c1555bdc5a38" // 2.4.3
  )
  
  //go:embed arvados.service
@@ -155,17 +155,14 @@ func (inst *installCommand) RunCommand(prog string, args []string, stdin io.Read
                         "default-jre-headless",
                         "gettext",
                         "libattr1-dev",
-                       "libcrypt-ssleay-perl",
                         "libfuse-dev",
                         "libgbm1", // cypress / workbench2 tests
                         "libgnutls28-dev",
-                       "libjson-perl",
                         "libpam-dev",
                         "libpcre3-dev",
                         "libpq-dev",
                         "libreadline-dev",
                         "libssl-dev",
-                       "libwww-perl",
                         "libxml2-dev",
                         "libxslt1-dev",
                         "linkchecker",
@@ -206,11 +203,11 @@ func (inst *installCommand) RunCommand(prog string, args []string, stdin io.Read
                 }
                 switch {
                 case osv.Debian && osv.Major >= 11:
-                       pkgs = append(pkgs, "g++", "libcurl4", "libcurl4-openssl-dev", "perl-modules-5.32")
+                       pkgs = append(pkgs, "g++", "libcurl4", "libcurl4-openssl-dev")
                 case osv.Debian && osv.Major >= 10:
-                       pkgs = append(pkgs, "g++", "libcurl4", "libcurl4-openssl-dev", "perl-modules")
+                       pkgs = append(pkgs, "g++", "libcurl4", "libcurl4-openssl-dev")
                 case osv.Debian || osv.Ubuntu:
-                       pkgs = append(pkgs, "g++", "libcurl3", "libcurl3-openssl-dev", "perl-modules")
+                       pkgs = append(pkgs, "g++", "libcurl3", "libcurl3-openssl-dev")
                 case osv.Centos:
                         pkgs = append(pkgs, "gcc", "gcc-c++", "libcurl-devel", "postgresql-devel")
                 }
@@ -510,6 +507,7 @@ setcap "cap_sys_admin+pei cap_sys_chroot+pei" /var/lib/arvados/bin/nsenter
                 } else {
                         err = inst.runBash(`
  NJS=`+nodejsversion+`
+rm -rf /var/lib/arvados/node-*-linux-x64
  wget --progress=dot:giga -O- https://nodejs.org/dist/${NJS}/node-${NJS}-linux-x64.tar.xz | sudo tar -C /var/lib/arvados -xJf -
  ln -sfv /var/lib/arvados/node-${NJS}-linux-x64/bin/{node,npm} /usr/local/bin/
  `, stdout, stderr)
diff --git a/lib/lsf/dispatch.go b/lib/lsf/dispatch.go

index e2348337e62992eb4463947690e809e1927bb232..d1408d23cb1a4e3c2274f40d2f02b66bda29e82d 100644 (file)
--- a/lib/lsf/dispatch.go
+++ b/lib/lsf/dispatch.go
@@ -18,6 +18,8 @@ import (
         "time"
  
         "git.arvados.org/arvados.git/lib/cmd"
+       "git.arvados.org/arvados.git/lib/controller/dblock"
+       "git.arvados.org/arvados.git/lib/ctrlctx"
         "git.arvados.org/arvados.git/lib/dispatchcloud"
         "git.arvados.org/arvados.git/lib/service"
         "git.arvados.org/arvados.git/sdk/go/arvados"
@@ -58,6 +60,7 @@ type dispatcher struct {
         Registry  *prometheus.Registry
  
         logger        logrus.FieldLogger
+       dbConnector   ctrlctx.DBConnector
         lsfcli        lsfcli
         lsfqueue      lsfqueue
         arvDispatcher *dispatch.Dispatcher
@@ -73,7 +76,9 @@ type dispatcher struct {
  func (disp *dispatcher) Start() {
         disp.initOnce.Do(func() {
                 disp.init()
+               dblock.Dispatch.Lock(context.Background(), disp.dbConnector.GetDB)
                 go func() {
+                       defer dblock.Dispatch.Unlock()
                         disp.checkLsfQueueForOrphans()
                         err := disp.arvDispatcher.Run(disp.Context)
                         if err != nil {
@@ -125,6 +130,7 @@ func (disp *dispatcher) init() {
                 lsfcli: &disp.lsfcli,
         }
         disp.ArvClient.AuthToken = disp.AuthToken
+       disp.dbConnector = ctrlctx.DBConnector{PostgreSQL: disp.Cluster.PostgreSQL}
         disp.stop = make(chan struct{}, 1)
         disp.stopped = make(chan struct{})
  
@@ -170,6 +176,19 @@ func (disp *dispatcher) runContainer(_ *dispatch.Dispatcher, ctr arvados.Contain
         if ctr.State != dispatch.Locked {
                 // already started by prior invocation
         } else if _, ok := disp.lsfqueue.Lookup(ctr.UUID); !ok {
+               if _, err := dispatchcloud.ChooseInstanceType(disp.Cluster, &ctr); errors.As(err, &dispatchcloud.ConstraintsNotSatisfiableError{}) {
+                       err := disp.arvDispatcher.Arv.Update("containers", ctr.UUID, arvadosclient.Dict{
+                               "container": map[string]interface{}{
+                                       "runtime_status": map[string]string{
+                                               "error": err.Error(),
+                                       },
+                               },
+                       }, nil)
+                       if err != nil {
+                               return fmt.Errorf("error setting runtime_status on %s: %s", ctr.UUID, err)
+                       }
+                       return disp.arvDispatcher.UpdateState(ctr.UUID, dispatch.Cancelled)
+               }
                 disp.logger.Printf("Submitting container %s to LSF", ctr.UUID)
                 cmd := []string{disp.Cluster.Containers.CrunchRunCommand}
                 cmd = append(cmd, "--runtime-engine="+disp.Cluster.Containers.RuntimeEngine)
@@ -184,9 +203,8 @@ func (disp *dispatcher) runContainer(_ *dispatch.Dispatcher, ctr arvados.Contain
         defer disp.logger.Printf("Done monitoring container %s", ctr.UUID)
  
         go func(uuid string) {
-               cancelled := false
                 for ctx.Err() == nil {
-                       qent, ok := disp.lsfqueue.Lookup(uuid)
+                       _, ok := disp.lsfqueue.Lookup(uuid)
                         if !ok {
                                 // If the container disappears from
                                 // the lsf queue, there is no point in
@@ -196,25 +214,6 @@ func (disp *dispatcher) runContainer(_ *dispatch.Dispatcher, ctr arvados.Contain
                                 cancel()
                                 return
                         }
-                       if !cancelled && qent.Stat == "PEND" && strings.Contains(qent.PendReason, "There are no suitable hosts for the job") {
-                               disp.logger.Printf("container %s: %s", uuid, qent.PendReason)
-                               err := disp.arvDispatcher.Arv.Update("containers", uuid, arvadosclient.Dict{
-                                       "container": map[string]interface{}{
-                                               "runtime_status": map[string]string{
-                                                       "error": qent.PendReason,
-                                               },
-                                       },
-                               }, nil)
-                               if err != nil {
-                                       disp.logger.Printf("error setting runtime_status on %s: %s", uuid, err)
-                                       continue // retry
-                               }
-                               err = disp.arvDispatcher.UpdateState(uuid, dispatch.Cancelled)
-                               if err != nil {
-                                       continue // retry (UpdateState() already logged the error)
-                               }
-                               cancelled = true
-                       }
                 }
         }(ctr.UUID)
  
diff --git a/lib/lsf/dispatch_test.go b/lib/lsf/dispatch_test.go

index a99983f34a8ae4163f9a91ba59c43ab9e57c3e00..a381b25e9d075bc993f6327c579107025a62fe79 100644 (file)
--- a/lib/lsf/dispatch_test.go
+++ b/lib/lsf/dispatch_test.go
@@ -32,6 +32,7 @@ var _ = check.Suite(&suite{})
  type suite struct {
         disp          *dispatcher
         crTooBig      arvados.ContainerRequest
+       crPending     arvados.ContainerRequest
         crCUDARequest arvados.ContainerRequest
  }
  
@@ -44,8 +45,16 @@ func (s *suite) SetUpTest(c *check.C) {
         c.Assert(err, check.IsNil)
         cluster, err := cfg.GetCluster("")
         c.Assert(err, check.IsNil)
+       cluster.Containers.ReserveExtraRAM = 256 << 20
         cluster.Containers.CloudVMs.PollInterval = arvados.Duration(time.Second / 4)
         cluster.Containers.MinRetryPeriod = arvados.Duration(time.Second / 4)
+       cluster.InstanceTypes = arvados.InstanceTypeMap{
+               "biggest_available_node": arvados.InstanceType{
+                       RAM:             100 << 30, // 100 GiB
+                       VCPUs:           4,
+                       IncludedScratch: 100 << 30,
+                       Scratch:         100 << 30,
+               }}
         s.disp = newHandler(context.Background(), cluster, arvadostest.Dispatch1Token, prometheus.NewRegistry()).(*dispatcher)
         s.disp.lsfcli.stubCommand = func(string, ...string) *exec.Cmd {
                 return exec.Command("bash", "-c", "echo >&2 unimplemented stub; false")
@@ -67,6 +76,23 @@ func (s *suite) SetUpTest(c *check.C) {
         })
         c.Assert(err, check.IsNil)
  
+       err = arvados.NewClientFromEnv().RequestAndDecode(&s.crPending, "POST", "arvados/v1/container_requests", nil, map[string]interface{}{
+               "container_request": map[string]interface{}{
+                       "runtime_constraints": arvados.RuntimeConstraints{
+                               RAM:   100000000,
+                               VCPUs: 2,
+                       },
+                       "container_image":     arvadostest.DockerImage112PDH,
+                       "command":             []string{"sleep", "1"},
+                       "mounts":              map[string]arvados.Mount{"/mnt/out": {Kind: "tmp", Capacity: 1000}},
+                       "output_path":         "/mnt/out",
+                       "state":               arvados.ContainerRequestStateCommitted,
+                       "priority":            1,
+                       "container_count_max": 1,
+               },
+       })
+       c.Assert(err, check.IsNil)
+
         err = arvados.NewClientFromEnv().RequestAndDecode(&s.crCUDARequest, "POST", "arvados/v1/container_requests", nil, map[string]interface{}{
                 "container_request": map[string]interface{}{
                         "runtime_constraints": arvados.RuntimeConstraints{
@@ -150,15 +176,15 @@ func (stub lsfstub) stubCommand(s *suite, c *check.C) func(prog string, args ...
                                 fakejobq[nextjobid] = args[1]
                                 nextjobid++
                                 mtx.Unlock()
-                       case s.crTooBig.ContainerUUID:
+                       case s.crPending.ContainerUUID:
                                 c.Check(args, check.DeepEquals, []string{
-                                       "-J", s.crTooBig.ContainerUUID,
-                                       "-n", "1",
-                                       "-D", "954187MB",
-                                       "-R", "rusage[mem=954187MB:tmp=256MB] span[hosts=1]",
-                                       "-R", "select[mem>=954187MB]",
-                                       "-R", "select[tmp>=256MB]",
-                                       "-R", "select[ncpus>=1]"})
+                                       "-J", s.crPending.ContainerUUID,
+                                       "-n", "2",
+                                       "-D", "352MB",
+                                       "-R", "rusage[mem=352MB:tmp=8448MB] span[hosts=1]",
+                                       "-R", "select[mem>=352MB]",
+                                       "-R", "select[tmp>=8448MB]",
+                                       "-R", "select[ncpus>=2]"})
                                 mtx.Lock()
                                 fakejobq[nextjobid] = args[1]
                                 nextjobid++
@@ -187,7 +213,7 @@ func (stub lsfstub) stubCommand(s *suite, c *check.C) func(prog string, args ...
                         var records []map[string]interface{}
                         for jobid, uuid := range fakejobq {
                                 stat, reason := "RUN", ""
-                               if uuid == s.crTooBig.ContainerUUID {
+                               if uuid == s.crPending.ContainerUUID {
                                         // The real bjobs output includes a trailing ';' here:
                                         stat, reason = "PEND", "There are no suitable hosts for the job;"
                                 }
@@ -242,23 +268,28 @@ func (s *suite) TestSubmit(c *check.C) {
                         c.Error("timed out")
                         break
                 }
+               // "crTooBig" should never be submitted to lsf because
+               // it is bigger than any configured instance type
+               if ent, ok := s.disp.lsfqueue.Lookup(s.crTooBig.ContainerUUID); ok {
+                       c.Errorf("Lookup(crTooBig) == true, ent = %#v", ent)
+                       break
+               }
                 // "queuedcontainer" should be running
                 if _, ok := s.disp.lsfqueue.Lookup(arvadostest.QueuedContainerUUID); !ok {
                         c.Log("Lookup(queuedcontainer) == false")
                         continue
                 }
+               // "crPending" should be pending
+               if ent, ok := s.disp.lsfqueue.Lookup(s.crPending.ContainerUUID); !ok {
+                       c.Logf("Lookup(crPending) == false", ent)
+                       continue
+               }
                 // "lockedcontainer" should be cancelled because it
                 // has priority 0 (no matching container requests)
                 if ent, ok := s.disp.lsfqueue.Lookup(arvadostest.LockedContainerUUID); ok {
                         c.Logf("Lookup(lockedcontainer) == true, ent = %#v", ent)
                         continue
                 }
-               // "crTooBig" should be cancelled because lsf stub
-               // reports there is no suitable instance type
-               if ent, ok := s.disp.lsfqueue.Lookup(s.crTooBig.ContainerUUID); ok {
-                       c.Logf("Lookup(crTooBig) == true, ent = %#v", ent)
-                       continue
-               }
                 var ctr arvados.Container
                 if err := s.disp.arvDispatcher.Arv.Get("containers", arvadostest.LockedContainerUUID, nil, &ctr); err != nil {
                         c.Logf("error getting container state for %s: %s", arvadostest.LockedContainerUUID, err)
@@ -275,7 +306,7 @@ func (s *suite) TestSubmit(c *check.C) {
                         c.Logf("container %s is not in the LSF queue but its arvados record has not been updated to state==Cancelled (state is %q)", s.crTooBig.ContainerUUID, ctr.State)
                         continue
                 } else {
-                       c.Check(ctr.RuntimeStatus["error"], check.Equals, "There are no suitable hosts for the job;")
+                       c.Check(ctr.RuntimeStatus["error"], check.Equals, "constraints not satisfiable by any configured instance type")
                 }
                 c.Log("reached desired state")
                 break
diff --git a/lib/pam/testclient.go b/lib/pam/testclient.go

index 33bd47a35722edc6e68990ec48c1aa290619e8e1..02a278c0e60fa6aed88490b1de0461558532eb9b 100644 (file)
--- a/lib/pam/testclient.go
+++ b/lib/pam/testclient.go
@@ -76,7 +76,7 @@ func main() {
         }
         err = tx.Authenticate(pam.DisallowNullAuthtok)
         if err != nil {
-               err = fmt.Errorf("PAM: %s (message = %q)", err, errorMessage)
+               err = fmt.Errorf("PAM: %s (message = %q, sentPassword = %v)", err, errorMessage, sentPassword)
                 logrus.WithError(err).Print("authentication failed")
                 os.Exit(1)
         }
diff --git a/sdk/cwl/arvados_cwl/__init__.py b/sdk/cwl/arvados_cwl/__init__.py

index 08a05d571cb8e41bb48265489fcec9f13b1e6100..550ecba1c100c95df9fc5358564d6bcd4fe9bacc 100644 (file)
--- a/sdk/cwl/arvados_cwl/__init__.py
+++ b/sdk/cwl/arvados_cwl/__init__.py
@@ -36,6 +36,7 @@ from arvados.api import OrderedJsonModel
  from .perf import Perf
  from ._version import __version__
  from .executor import ArvCwlExecutor
+from .fsaccess import workflow_uuid_pattern
  
  # These aren't used directly in this file but
  # other code expects to import them from here
@@ -199,6 +200,10 @@ def arg_parser():  # type: () -> argparse.ArgumentParser
                          action="store_false", default=True,
                          help=argparse.SUPPRESS)
  
+    parser.add_argument("--disable-git", dest="git_info",
+                        action="store_false", default=True,
+                        help=argparse.SUPPRESS)
+
      parser.add_argument("--disable-color", dest="enable_color",
                          action="store_false", default=True,
                          help=argparse.SUPPRESS)
@@ -213,6 +218,15 @@ def arg_parser():  # type: () -> argparse.ArgumentParser
      parser.add_argument("--http-timeout", type=int,
                          default=5*60, dest="http_timeout", help="API request timeout in seconds. Default is 300 seconds (5 minutes).")
  
+    parser.add_argument("--defer-downloads", action="store_true", default=False,
+                        help="When submitting a workflow, defer downloading HTTP URLs to workflow launch instead of downloading to Keep before submit.")
+
+    parser.add_argument("--varying-url-params", type=str, default="",
+                        help="A comma separated list of URL query parameters that should be ignored when storing HTTP URLs in Keep.")
+
+    parser.add_argument("--prefer-cached-downloads", action="store_true", default=False,
+                        help="If a HTTP URL is found in Keep, skip upstream URL freshness check (will not notice if the upstream has changed, but also not error if upstream is unavailable).")
+
      exgroup = parser.add_mutually_exclusive_group()
      exgroup.add_argument("--enable-preemptible", dest="enable_preemptible", default=None, action="store_true", help="Use preemptible instances. Control individual steps with arv:UsePreemptible hint.")
      exgroup.add_argument("--disable-preemptible", dest="enable_preemptible", default=None, action="store_false", help="Don't use preemptible instances.")
@@ -319,7 +333,8 @@ def main(args=sys.argv[1:],
              # Make an API object now so errors are reported early.
              api_client.users().current().execute()
          if keep_client is None:
-            keep_client = arvados.keep.KeepClient(api_client=api_client, num_retries=4)
+            block_cache = arvados.keep.KeepBlockCache(disk_cache=True)
+            keep_client = arvados.keep.KeepClient(api_client=api_client, num_retries=4, block_cache=block_cache)
          executor = ArvCwlExecutor(api_client, arvargs, keep_client=keep_client, num_retries=4, stdout=stdout)
      except WorkflowException as e:
          logger.error(e, exc_info=(sys.exc_info()[1] if arvargs.debug else False))
@@ -359,6 +374,10 @@ def main(args=sys.argv[1:],
          # unit tests.
          stdout = None
  
+    if arvargs.submit and (arvargs.workflow.startswith("arvwf:") or workflow_uuid_pattern.match(arvargs.workflow)):
+        executor.loadingContext.do_validate = False
+        executor.fast_submit = True
+
      return cwltool.main.main(args=arvargs,
                               stdout=stdout,
                               stderr=stderr,
diff --git a/sdk/cwl/arvados_cwl/arvcontainer.py b/sdk/cwl/arvados_cwl/arvcontainer.py

index e9b58bc83b2fb4b655676acab301a6528f170a77..6fcf366e02aeed8aca3bc25a56d8562f0ba812f7 100644 (file)
--- a/sdk/cwl/arvados_cwl/arvcontainer.py
+++ b/sdk/cwl/arvados_cwl/arvcontainer.py
@@ -91,6 +91,8 @@ class ArvadosContainer(JobBase):
          container_request["state"] = "Committed"
          container_request.setdefault("properties", {})
  
+        container_request["properties"]["cwl_input"] = self.joborder
+
          runtime_constraints = {}
  
          if runtimeContext.project_uuid:
@@ -265,7 +267,11 @@ class ArvadosContainer(JobBase):
          runtime_req, _ = self.get_requirement("http://arvados.org/cwl#RuntimeConstraints")
          if runtime_req:
              if "keep_cache" in runtime_req:
-                runtime_constraints["keep_cache_ram"] = math.ceil(runtime_req["keep_cache"] * 2**20)
+                if self.arvrunner.api.config()["Containers"].get("DefaultKeepCacheDisk", 0) > 0:
+                    # If DefaultKeepCacheDisk is non-zero it means we should use disk cache.
+                    runtime_constraints["keep_cache_disk"] = math.ceil(runtime_req["keep_cache"] * 2**20)
+                else:
+                    runtime_constraints["keep_cache_ram"] = math.ceil(runtime_req["keep_cache"] * 2**20)
              if "outputDirType" in runtime_req:
                  if runtime_req["outputDirType"] == "local_output_dir":
                      # Currently the default behavior.
@@ -437,6 +443,13 @@ class ArvadosContainer(JobBase):
  
              if container["output"]:
                  outputs = done.done_outputs(self, container, "/tmp", self.outdir, "/keep")
+
+            properties = record["properties"].copy()
+            properties["cwl_output"] = outputs
+            self.arvrunner.api.container_requests().update(
+                uuid=self.uuid,
+                body={"container_request": {"properties": properties}}
+            ).execute(num_retries=self.arvrunner.num_retries)
          except WorkflowException as e:
              # Only include a stack trace if in debug mode.
              # A stack trace may obfuscate more useful output about the workflow.
@@ -514,6 +527,15 @@ class RunnerContainer(Runner):
                  "kind": "collection",
                  "portable_data_hash": "%s" % workflowcollection
              }
+        elif self.embedded_tool.tool.get("id", "").startswith("arvwf:"):
+            workflowpath = "/var/lib/cwl/workflow.json#main"
+            record = self.arvrunner.api.workflows().get(uuid=self.embedded_tool.tool["id"][6:33]).execute(num_retries=self.arvrunner.num_retries)
+            packed = yaml.safe_load(record["definition"])
+            container_req["mounts"]["/var/lib/cwl/workflow.json"] = {
+                "kind": "json",
+                "content": packed
+            }
+            container_req["properties"]["template_uuid"] = self.embedded_tool.tool["id"][6:33]
          else:
              packed = packed_workflow(self.arvrunner, self.embedded_tool, self.merged_map, runtimeContext, git_info)
              workflowpath = "/var/lib/cwl/workflow.json#main"
@@ -521,8 +543,6 @@ class RunnerContainer(Runner):
                  "kind": "json",
                  "content": packed
              }
-            if self.embedded_tool.tool.get("id", "").startswith("arvwf:"):
-                container_req["properties"]["template_uuid"] = self.embedded_tool.tool["id"][6:33]
  
          container_req["properties"].update({k.replace("http://arvados.org/cwl#", "arv:"): v for k, v in git_info.items()})
  
@@ -588,6 +608,12 @@ class RunnerContainer(Runner):
          if runtimeContext.enable_preemptible is False:
              command.append("--disable-preemptible")
  
+        if runtimeContext.varying_url_params:
+            command.append("--varying-url-params="+runtimeContext.varying_url_params)
+
+        if runtimeContext.prefer_cached_downloads:
+            command.append("--prefer-cached-downloads")
+
          command.extend([workflowpath, "/var/lib/cwl/cwl.input.json"])
  
          container_req["command"] = command
diff --git a/sdk/cwl/arvados_cwl/arvworkflow.py b/sdk/cwl/arvados_cwl/arvworkflow.py

index 5f3feabf8c83271ccec89d667d296663b86fecfa..56226388d7ab36618d1ff354c70d6bf512c18cea 100644 (file)
--- a/sdk/cwl/arvados_cwl/arvworkflow.py
+++ b/sdk/cwl/arvados_cwl/arvworkflow.py
@@ -13,6 +13,8 @@ import logging
  from schema_salad.sourceline import SourceLine, cmap
  import schema_salad.ref_resolver
  
+import arvados.collection
+
  from cwltool.pack import pack
  from cwltool.load_tool import fetch_document, resolve_and_validate_document
  from cwltool.process import shortname
@@ -37,6 +39,84 @@ metrics = logging.getLogger('arvados.cwl-runner.metrics')
  max_res_pars = ("coresMin", "coresMax", "ramMin", "ramMax", "tmpdirMin", "tmpdirMax")
  sum_res_pars = ("outdirMin", "outdirMax")
  
+def make_wrapper_workflow(arvRunner, main, packed, project_uuid, name, git_info, tool):
+    """Store the packed workflow in a collection and build a wrapper workflow for it.
+
+    The packed document is written as workflow.json into a collection, which
+    is saved under project_uuid unless that project already holds a
+    collection with the same portable data hash.  A Workflow with a single
+    step that runs keep:<pdh>/workflow.json#main is then assembled: its
+    inputs are copied from main["inputs"] (selected fields only), its
+    outputs mirror main["outputs"], and the requirements and hints of main
+    are carried over.  The entries of git_info, if any, are added as
+    top-level fields of the document.
+
+    Returns the wrapper document serialized as a JSON string.
+    """
+    col = arvados.collection.Collection(api_client=arvRunner.api,
+                                        keep_client=arvRunner.keep_client)
+
+    # Write the packed workflow into the collection as workflow.json.
+    with col.open("workflow.json", "wt") as f:
+        json.dump(packed, f, sort_keys=True, indent=4, separators=(',',': '))
+
+    pdh = col.portable_data_hash()
+
+    # The name is the tool label, falling back to the basename of the tool
+    # id; the gitDescribe value is appended when git_info provides one.
+    toolname = tool.tool.get("label") or tool.metadata.get("label") or os.path.basename(tool.tool["id"])
+    if git_info and git_info.get("http://arvados.org/cwl#gitDescribe"):
+        toolname = "%s (%s)" % (toolname, git_info.get("http://arvados.org/cwl#gitDescribe"))
+
+    # Only save a new collection when the project has none with this
+    # portable data hash.
+    existing = arvRunner.api.collections().list(filters=[["portable_data_hash", "=", pdh], ["owner_uuid", "=", project_uuid]]).execute(num_retries=arvRunner.num_retries)
+    if len(existing["items"]) == 0:
+        col.save_new(name=toolname, owner_uuid=project_uuid, ensure_unique_name=True)
+
+    # now construct the wrapper
+
+    step = {
+        "id": "#main/" + toolname,
+        "in": [],
+        "out": [],
+        "run": "keep:%s/workflow.json#main" % pdh,
+        "label": name
+    }
+
+    newinputs = []
+    for i in main["inputs"]:
+        inp = {}
+        # Make sure to only copy known fields that are meaningful at
+        # the workflow level. In practice this ensures that if we're
+        # wrapping a CommandLineTool we don't grab inputBinding.
+        # Right now also excludes extension fields, which is fine,
+        # Arvados doesn't currently look for any extension fields on
+        # input parameters.
+        for f in ("type", "label", "secondaryFiles", "streamable",
+                  "doc", "id", "format", "loadContents",
+                  "loadListing", "default"):
+            if f in i:
+                inp[f] = i[f]
+        newinputs.append(inp)
+
+    wrapper = {
+        "class": "Workflow",
+        "id": "#main",
+        "inputs": newinputs,
+        "outputs": [],
+        "steps": [step]
+    }
+
+    # Feed every wrapper input into the step input with the same short name.
+    for i in main["inputs"]:
+        step["in"].append({
+            "id": "#main/step/%s" % shortname(i["id"]),
+            "source": i["id"]
+        })
+
+    # Declare each output on the step and expose it, with its original id
+    # and type, as an output of the wrapper.
+    for i in main["outputs"]:
+        step["out"].append({"id": "#main/step/%s" % shortname(i["id"])})
+        wrapper["outputs"].append({"outputSource": "#main/step/%s" % shortname(i["id"]),
+                                   "type": i["type"],
+                                   "id": i["id"]})
+
+    # SubworkflowFeatureRequirement is always declared; the requirements and
+    # hints of the wrapped workflow are added on top of it.
+    wrapper["requirements"] = [{"class": "SubworkflowFeatureRequirement"}]
+
+    if main.get("requirements"):
+        wrapper["requirements"].extend(main["requirements"])
+    if main.get("hints"):
+        wrapper["hints"] = main["hints"]
+
+    doc = {"cwlVersion": "v1.2", "$graph": [wrapper]}
+
+    # Copy every git_info entry into the top level of the document.
+    if git_info:
+        for g in git_info:
+            doc[g] = git_info[g]
+
+    return json.dumps(doc, sort_keys=True, indent=4, separators=(',',': '))
+
  def upload_workflow(arvRunner, tool, job_order, project_uuid,
                      runtimeContext, uuid=None,
                      submit_runner_ram=0, name=None, merged_map=None,
@@ -84,11 +164,13 @@ def upload_workflow(arvRunner, tool, job_order, project_uuid,
  
      main["hints"] = hints
  
+    wrapper = make_wrapper_workflow(arvRunner, main, packed, project_uuid, name, git_info, tool)
+
      body = {
          "workflow": {
              "name": name,
              "description": tool.tool.get("doc", ""),
-            "definition":json.dumps(packed, sort_keys=True, indent=4, separators=(',',': '))
+            "definition": wrapper
          }}
      if project_uuid:
          body["workflow"]["owner_uuid"] = project_uuid
@@ -147,8 +229,13 @@ class ArvadosWorkflowStep(WorkflowStep):
                   **argv
                  ):  # type: (...) -> None
  
-        super(ArvadosWorkflowStep, self).__init__(toolpath_object, pos, loadingContext, *argc, **argv)
-        self.tool["class"] = "WorkflowStep"
+        if arvrunner.fast_submit:
+            self.tool = toolpath_object
+            self.tool["inputs"] = []
+            self.tool["outputs"] = []
+        else:
+            super(ArvadosWorkflowStep, self).__init__(toolpath_object, pos, loadingContext, *argc, **argv)
+            self.tool["class"] = "WorkflowStep"
          self.arvrunner = arvrunner
  
      def job(self, joborder, output_callback, runtimeContext):
diff --git a/sdk/cwl/arvados_cwl/context.py b/sdk/cwl/arvados_cwl/context.py

index 64f85e20763590fd173e57046f471f6e41602ac2..3ce561f66d3404e03c4aab19470439af22bf83dd 100644 (file)
--- a/sdk/cwl/arvados_cwl/context.py
+++ b/sdk/cwl/arvados_cwl/context.py
@@ -39,6 +39,9 @@ class ArvRuntimeContext(RuntimeContext):
          self.match_local_docker = False
          self.enable_preemptible = None
          self.copy_deps = None
+        self.defer_downloads = False
+        self.varying_url_params = ""
+        self.prefer_cached_downloads = False
  
          super(ArvRuntimeContext, self).__init__(kwargs)
  
diff --git a/sdk/cwl/arvados_cwl/executor.py b/sdk/cwl/arvados_cwl/executor.py

index 694f77baf246ecb56e6116e99dd5461deb9f6e53..447c14b8bfad4c8339addcbce9c6899aa2e06b72 100644 (file)
--- a/sdk/cwl/arvados_cwl/executor.py
+++ b/sdk/cwl/arvados_cwl/executor.py
@@ -70,6 +70,10 @@ class RuntimeStatusLoggingHandler(logging.Handler):
              kind = 'error'
          elif record.levelno >= logging.WARNING:
              kind = 'warning'
+        if kind == 'warning' and record.name == "salad":
+            # Don't send validation warnings to runtime status,
+            # they're noisy and unhelpful.
+            return
          if kind is not None and self.updatingRuntimeStatus is not True:
              self.updatingRuntimeStatus = True
              try:
@@ -112,6 +116,9 @@ class ArvCwlExecutor(object):
              arvargs.output_tags = None
              arvargs.thread_count = 1
              arvargs.collection_cache_size = None
+            arvargs.git_info = True
+            arvargs.submit = False
+            arvargs.defer_downloads = False
  
          self.api = api_client
          self.processes = {}
@@ -137,6 +144,8 @@ class ArvCwlExecutor(object):
          self.fs_access = None
          self.secret_store = None
          self.stdout = stdout
+        self.fast_submit = False
+        self.git_info = arvargs.git_info
  
          if keep_client is not None:
              self.keep_client = keep_client
@@ -203,6 +212,8 @@ The 'jobs' API is no longer supported.
          self.toplevel_runtimeContext.make_fs_access = partial(CollectionFsAccess,
                                                       collection_cache=self.collection_cache)
  
+        self.defer_downloads = arvargs.submit and arvargs.defer_downloads
+
          validate_cluster_target(self, self.toplevel_runtimeContext)
  
  
@@ -358,8 +369,8 @@ The 'jobs' API is no longer supported.
                      page = keys[:pageSize]
                      try:
                          proc_states = table.list(filters=[["uuid", "in", page]]).execute(num_retries=self.num_retries)
-                    except Exception:
-                        logger.exception("Error checking states on API server: %s")
+                    except Exception as e:
+                        logger.exception("Error checking states on API server: %s", e)
                          remain_wait = self.poll_interval
                          continue
  
@@ -582,7 +593,7 @@ The 'jobs' API is no longer supported.
      def arv_executor(self, updated_tool, job_order, runtimeContext, logger=None):
          self.debug = runtimeContext.debug
  
-        git_info = self.get_git_info(updated_tool)
+        git_info = self.get_git_info(updated_tool) if self.git_info else {}
          if git_info:
              logger.info("Git provenance")
              for g in git_info:
@@ -594,7 +605,8 @@ The 'jobs' API is no longer supported.
          controller = self.api.config()["Services"]["Controller"]["ExternalURL"]
          logger.info("Using cluster %s (%s)", self.api.config()["ClusterID"], workbench2 or workbench1 or controller)
  
-        updated_tool.visit(self.check_features)
+        if not self.fast_submit:
+            updated_tool.visit(self.check_features)
  
          self.pipeline = None
          self.fs_access = runtimeContext.make_fs_access(runtimeContext.basedir)
@@ -662,7 +674,7 @@ The 'jobs' API is no longer supported.
          loadingContext = self.loadingContext.copy()
          loadingContext.do_validate = False
          loadingContext.disable_js_validation = True
-        if submitting:
+        if submitting and not self.fast_submit:
              loadingContext.do_update = False
              # Document may have been auto-updated. Reload the original
              # document with updating disabled because we want to
@@ -675,9 +687,12 @@ The 'jobs' API is no longer supported.
  
          # Upload direct dependencies of workflow steps, get back mapping of files to keep references.
          # Also uploads docker images.
-        logger.info("Uploading workflow dependencies")
-        with Perf(metrics, "upload_workflow_deps"):
-            merged_map = upload_workflow_deps(self, tool, runtimeContext)
+        if not self.fast_submit:
+            logger.info("Uploading workflow dependencies")
+            with Perf(metrics, "upload_workflow_deps"):
+                merged_map = upload_workflow_deps(self, tool, runtimeContext)
+        else:
+            merged_map = {}
  
          # Recreate process object (ArvadosWorkflow or
          # ArvadosCommandTool) because tool document may have been
diff --git a/sdk/cwl/arvados_cwl/fsaccess.py b/sdk/cwl/arvados_cwl/fsaccess.py

index 4da8f855692aed44f212739d5e515af3fef2ceb0..5c09e671fa21eac1952c417e10580d332e3612be 100644 (file)
--- a/sdk/cwl/arvados_cwl/fsaccess.py
+++ b/sdk/cwl/arvados_cwl/fsaccess.py
@@ -244,10 +244,11 @@ class CollectionFetcher(DefaultFetcher):
          try:
              if url.startswith("http://arvados.org/cwl"):
                  return True
-            if url.startswith("keep:"):
-                return self.fsaccess.exists(url)
-            if url.startswith("arvwf:"):
-                if self.fetch_text(url):
+            urld, _ = urllib.parse.urldefrag(url)
+            if urld.startswith("keep:"):
+                return self.fsaccess.exists(urld)
+            if urld.startswith("arvwf:"):
+                if self.fetch_text(urld):
                      return True
          except arvados.errors.NotFoundError:
              return False
diff --git a/sdk/cwl/arvados_cwl/http.py b/sdk/cwl/arvados_cwl/http.py

index dcc2a51192dfc4d4b573da302b3373fd08d67fff..f2415bcffef40ef805b4e3a0213778caac16f63e 100644 (file)
--- a/sdk/cwl/arvados_cwl/http.py
+++ b/sdk/cwl/arvados_cwl/http.py
@@ -72,48 +72,104 @@ def remember_headers(url, properties, headers, now):
          properties[url]["Date"] = my_formatdate(now)
  
  
-def changed(url, properties, now):
+def changed(url, clean_url, properties, now):
+    """Use a HEAD request to decide whether url may differ from the cached copy.
+
+    On a 200 response the entry cached under properties[url] is removed
+    and the response headers are recorded through remember_headers()
+    under clean_url.
+
+    Returns False only when the response carries an ETag equal to the
+    cached one.  Returns True otherwise, including when the HEAD request
+    does not answer with status 200 (properties is left untouched then).
+    """
      req = requests.head(url, allow_redirects=True)
-    remember_headers(url, properties, req.headers, now)
  
      if req.status_code != 200:
-        raise Exception("Got status %s" % req.status_code)
+        # Sometimes endpoints are misconfigured and will deny HEAD but
+        # allow GET so instead of failing here, we'll try GET If-None-Match
+        return True
  
-    pr = properties[url]
-    if "ETag" in pr and "ETag" in req.headers:
-        if pr["ETag"] == req.headers["ETag"]:
-            return False
+    # Take the cached entry out in a single step.  A missing entry just
+    # means there is no ETag to compare against, instead of a KeyError.
+    etag = properties.pop(url, {}).get("ETag")
+
+    remember_headers(clean_url, properties, req.headers, now)
+
+    if "ETag" in req.headers and etag == req.headers["ETag"]:
+        # Didn't change
+        return False
  
      return True
  
-def http_to_keep(api, project_uuid, url, utcnow=datetime.datetime.utcnow):
-    r = api.collections().list(filters=[["properties", "exists", url]]).execute()
+def etag_quote(etag):
+    """Return etag in the quoted form used in an If-None-Match header.
+
+    Values that are already quoted ("abc") and weak validators whose
+    opaque part is quoted (W/"abc") are returned unchanged.  Anything
+    else, including the empty string, is wrapped in double quotes.
+    """
+    # A weak validator carries its quotes after the W/ prefix; wrapping
+    # the whole value again would produce a malformed entity-tag.
+    opaque = etag[2:] if etag.startswith("W/") else etag
+    # The length check keeps a lone '"' (and the empty string) from being
+    # mistaken for an already quoted value.
+    if len(opaque) >= 2 and opaque[0] == '"' and opaque[-1] == '"':
+        return etag
+    else:
+        # Add quotes.
+        return '"' + etag + '"'
+
+
+def http_to_keep(api, project_uuid, url, utcnow=datetime.datetime.utcnow, varying_url_params="", prefer_cached_downloads=False):
+    varying_params = [s.strip() for s in varying_url_params.split(",")]
+
+    parsed = urllib.parse.urlparse(url)
+    query = [q for q in urllib.parse.parse_qsl(parsed.query)
+             if q[0] not in varying_params]
+
+    clean_url = urllib.parse.urlunparse((parsed.scheme, parsed.netloc, parsed.path, parsed.params,
+                                         urllib.parse.urlencode(query, safe="/"),  parsed.fragment))
+
+    r1 = api.collections().list(filters=[["properties", "exists", url]]).execute()
+
+    if clean_url == url:
+        items = r1["items"]
+    else:
+        r2 = api.collections().list(filters=[["properties", "exists", clean_url]]).execute()
+        items = r1["items"] + r2["items"]
  
      now = utcnow()
  
-    for item in r["items"]:
+    etags = {}
+
+    for item in items:
          properties = item["properties"]
-        if fresh_cache(url, properties, now):
-            # Do nothing
+
+        if clean_url in properties:
+            cache_url = clean_url
+        elif url in properties:
+            cache_url = url
+        else:
+            return False
+
+        if prefer_cached_downloads or fresh_cache(cache_url, properties, now):
+            # HTTP caching rules say we should use the cache
              cr = arvados.collection.CollectionReader(item["portable_data_hash"], api_client=api)
              return "keep:%s/%s" % (item["portable_data_hash"], list(cr.keys())[0])
  
-        if not changed(url, properties, now):
+        if not changed(cache_url, clean_url, properties, now):
              # ETag didn't change, same content, just update headers
              api.collections().update(uuid=item["uuid"], body={"collection":{"properties": properties}}).execute()
              cr = arvados.collection.CollectionReader(item["portable_data_hash"], api_client=api)
              return "keep:%s/%s" % (item["portable_data_hash"], list(cr.keys())[0])
  
+        if "ETag" in properties[cache_url] and len(properties[cache_url]["ETag"]) > 2:
+            etags[properties[cache_url]["ETag"]] = item
+
+    logger.debug("Found ETags %s", etags)
+
      properties = {}
-    req = requests.get(url, stream=True, allow_redirects=True)
+    headers = {}
+    if etags:
+        headers['If-None-Match'] = ', '.join([etag_quote(k) for k,v in etags.items()])
+    logger.debug("Sending GET request with headers %s", headers)
+    req = requests.get(url, stream=True, allow_redirects=True, headers=headers)
  
-    if req.status_code != 200:
+    if req.status_code not in (200, 304):
          raise Exception("Failed to download '%s' got status %s " % (url, req.status_code))
  
-    remember_headers(url, properties, req.headers, now)
+    remember_headers(clean_url, properties, req.headers, now)
+
+    if req.status_code == 304 and "ETag" in req.headers and req.headers["ETag"] in etags:
+        item = etags[req.headers["ETag"]]
+        item["properties"].update(properties)
+        api.collections().update(uuid=item["uuid"], body={"collection":{"properties": item["properties"]}}).execute()
+        cr = arvados.collection.CollectionReader(item["portable_data_hash"], api_client=api)
+        return "keep:%s/%s" % (item["portable_data_hash"], list(cr.keys())[0])
  
-    if "Content-Length" in properties[url]:
-        cl = int(properties[url]["Content-Length"])
+    if "Content-Length" in properties[clean_url]:
+        cl = int(properties[clean_url]["Content-Length"])
          logger.info("Downloading %s (%s bytes)", url, cl)
      else:
          cl = None
@@ -128,7 +184,7 @@ def http_to_keep(api, project_uuid, url, utcnow=datetime.datetime.utcnow):
          else:
              name = grp.group(4)
      else:
-        name = urllib.parse.urlparse(url).path.split("/")[-1]
+        name = parsed.path.split("/")[-1]
  
      count = 0
      start = time.time()
@@ -149,8 +205,18 @@ def http_to_keep(api, project_uuid, url, utcnow=datetime.datetime.utcnow):
                      logger.info("%d downloaded, %3.2f MiB/s", count, (bps / (1024*1024)))
                  checkpoint = loopnow
  
+    logger.info("Download complete")
+
+    collectionname = "Downloaded from %s" % urllib.parse.quote(clean_url, safe='')
+
+    # max length - space to add a timestamp used by ensure_unique_name
+    max_name_len = 254 - 28
+
+    if len(collectionname) > max_name_len:
+        over = len(collectionname) - max_name_len
+        split = int(max_name_len/2)
+        collectionname = collectionname[0:split] + "…" + collectionname[split+over:]
  
-    collectionname = "Downloaded from %s" % urllib.parse.quote(url, safe='')
      c.save_new(name=collectionname, owner_uuid=project_uuid, ensure_unique_name=True)
  
      api.collections().update(uuid=c.manifest_locator(), body={"collection":{"properties": properties}}).execute()
diff --git a/sdk/cwl/arvados_cwl/pathmapper.py b/sdk/cwl/arvados_cwl/pathmapper.py

index 64fdfa0d04032e97235dc581144d9cb74494c597..e2e287bf1dbd9cbcfbe63275ae40087393bb1d1f 100644 (file)
--- a/sdk/cwl/arvados_cwl/pathmapper.py
+++ b/sdk/cwl/arvados_cwl/pathmapper.py
@@ -105,9 +105,15 @@ class ArvPathMapper(PathMapper):
                      raise WorkflowException("Directory literal '%s' is missing `listing`" % src)
              elif src.startswith("http:") or src.startswith("https:"):
                  try:
-                    keepref = http_to_keep(self.arvrunner.api, self.arvrunner.project_uuid, src)
-                    logger.info("%s is %s", src, keepref)
-                    self._pathmap[src] = MapperEnt(keepref, keepref, srcobj["class"], True)
+                    if self.arvrunner.defer_downloads:
+                        # passthrough, we'll download it later.
+                        self._pathmap[src] = MapperEnt(src, src, srcobj["class"], True)
+                    else:
+                        keepref = http_to_keep(self.arvrunner.api, self.arvrunner.project_uuid, src,
+                                               varying_url_params=self.arvrunner.toplevel_runtimeContext.varying_url_params,
+                                               prefer_cached_downloads=self.arvrunner.toplevel_runtimeContext.prefer_cached_downloads)
+                        logger.info("%s is %s", src, keepref)
+                        self._pathmap[src] = MapperEnt(keepref, keepref, srcobj["class"], True)
                  except Exception as e:
                      logger.warning(str(e))
              else:
@@ -156,6 +162,9 @@ class ArvPathMapper(PathMapper):
          if loc.startswith("_:"):
              return True
  
+        if self.arvrunner.defer_downloads and (loc.startswith("http:") or loc.startswith("https:")):
+            return False
+
          i = loc.rfind("/")
          if i > -1:
              loc_prefix = loc[:i+1]
diff --git a/sdk/cwl/arvados_cwl/runner.py b/sdk/cwl/arvados_cwl/runner.py

index 1544d05cd70660c6e046ef80073b7c80fb7c52c2..4861039198a18c36dbd0ae6d805be060cff1e224 100644 (file)
--- a/sdk/cwl/arvados_cwl/runner.py
+++ b/sdk/cwl/arvados_cwl/runner.py
@@ -53,13 +53,14 @@ from cwltool.command_line_tool import CommandLineTool
  import cwltool.workflow
  from cwltool.process import (scandeps, UnsupportedRequirement, normalizeFilesDirs,
                               shortname, Process, fill_in_defaults)
-from cwltool.load_tool import fetch_document
+from cwltool.load_tool import fetch_document, jobloaderctx
  from cwltool.utils import aslist, adjustFileObjs, adjustDirObjs, visit_class
  from cwltool.builder import substitute
  from cwltool.pack import pack
  from cwltool.update import INTERNAL_VERSION
  from cwltool.builder import Builder
  import schema_salad.validate as validate
+import schema_salad.ref_resolver
  
  import arvados.collection
  import arvados.util
@@ -694,9 +695,12 @@ def upload_job_order(arvrunner, name, tool, job_order, runtimeContext):
                               tool.tool["inputs"],
                               job_order)
  
+    _jobloaderctx = jobloaderctx.copy()
+    jobloader = schema_salad.ref_resolver.Loader(_jobloaderctx, fetcher_constructor=tool.doc_loader.fetcher_constructor)
+
      jobmapper = upload_dependencies(arvrunner,
                                      name,
-                                    tool.doc_loader,
+                                    jobloader,
                                      job_order,
                                      job_order.get("id", "#"),
                                      False,
@@ -724,28 +728,37 @@ def upload_workflow_deps(arvrunner, tool, runtimeContext):
  
      merged_map = {}
      tool_dep_cache = {}
+
+    todo = []
+
+    # Standard traversal is top down, we want to go bottom up, so use
+    # the visitor to accumulate a list of nodes to visit, then
+    # visit them in reverse order.
      def upload_tool_deps(deptool):
          if "id" in deptool:
-            discovered_secondaryfiles = {}
-            with Perf(metrics, "upload_dependencies %s" % shortname(deptool["id"])):
-                pm = upload_dependencies(arvrunner,
-                                         "%s dependencies" % (shortname(deptool["id"])),
-                                         document_loader,
-                                         deptool,
-                                         deptool["id"],
-                                         False,
-                                         runtimeContext,
-                                         include_primary=False,
-                                         discovered_secondaryfiles=discovered_secondaryfiles,
-                                         cache=tool_dep_cache)
-            document_loader.idx[deptool["id"]] = deptool
-            toolmap = {}
-            for k,v in pm.items():
-                toolmap[k] = v.resolved
-            merged_map[deptool["id"]] = FileUpdates(toolmap, discovered_secondaryfiles)
+            todo.append(deptool)
  
      tool.visit(upload_tool_deps)
  
+    for deptool in reversed(todo):
+        discovered_secondaryfiles = {}
+        with Perf(metrics, "upload_dependencies %s" % shortname(deptool["id"])):
+            pm = upload_dependencies(arvrunner,
+                                     "%s dependencies" % (shortname(deptool["id"])),
+                                     document_loader,
+                                     deptool,
+                                     deptool["id"],
+                                     False,
+                                     runtimeContext,
+                                     include_primary=False,
+                                     discovered_secondaryfiles=discovered_secondaryfiles,
+                                     cache=tool_dep_cache)
+        document_loader.idx[deptool["id"]] = deptool
+        toolmap = {}
+        for k,v in pm.items():
+            toolmap[k] = v.resolved
+        merged_map[deptool["id"]] = FileUpdates(toolmap, discovered_secondaryfiles)
+
      return merged_map
  
  def arvados_jobs_image(arvrunner, img, runtimeContext):
diff --git a/sdk/cwl/setup.py b/sdk/cwl/setup.py

index e70955c20bb9b359c2ff67db666209a3c99a74e8..e1a5077fb84c29e5b5a8a333a3bcacd1aaa4abd1 100644 (file)
--- a/sdk/cwl/setup.py
+++ b/sdk/cwl/setup.py
@@ -39,10 +39,11 @@ setup(name='arvados-cwl-runner',
            'cwltool==3.1.20220907141119',
            'schema-salad==8.3.20220913105718',
            'arvados-python-client{}'.format(pysdk_dep),
-          'setuptools',
            'ciso8601 >= 2.0.0',
            'networkx < 2.6',
-          'msgpack==1.0.3'
+          'msgpack==1.0.3',
+          'importlib-metadata<5',
+          'setuptools>=40.3.0'
        ],
        data_files=[
            ('share/doc/arvados-cwl-runner', ['LICENSE-2.0.txt', 'README.rst']),
diff --git a/sdk/cwl/tests/19678-name-id.cwl b/sdk/cwl/tests/19678-name-id.cwl

new file mode 100644 (file)

index 0000000..afed34b
--- /dev/null
+++ b/sdk/cwl/tests/19678-name-id.cwl
@@ -0,0 +1,26 @@
+# Copyright (C) The Arvados Authors. All rights reserved.
+#
+# SPDX-License-Identifier: Apache-2.0
+
+class: Workflow
+cwlVersion: v1.1
+inputs:
+  - type:
+      fields:
+        - name: first
+          type: string
+        - name: last
+          type: string
+      type: record
+    id: name
+outputs:
+  - type:
+      fields:
+        - name: first
+          type: string
+        - name: last
+          type: string
+      type: record
+    id: processed_name
+    outputSource: name
+steps: []
diff --git a/sdk/cwl/tests/arvados-tests.yml b/sdk/cwl/tests/arvados-tests.yml

index 2f309cfe81e6aae5a26ebacdea842d957d07ab0b..4ed4d4ac32fcc014dcdf57b592e1661bb1188926 100644 (file)
--- a/sdk/cwl/tests/arvados-tests.yml
+++ b/sdk/cwl/tests/arvados-tests.yml
@@ -469,3 +469,13 @@
    }
    tool: 19109-upload-secondary.cwl
    doc: "Test issue 19109 - correctly discover & upload secondary files"
+
+- job: 19678-name-id.yml
+  output: {
+    "processed_name": {
+        "first": "foo",
+        "last": "bar"
+    }
+  }
+  tool: 19678-name-id.cwl
+  doc: "Test issue 19678 - non-string type input parameter called 'name'"
diff --git a/sdk/cwl/tests/collection_per_tool/collection_per_tool_wrapper.cwl b/sdk/cwl/tests/collection_per_tool/collection_per_tool_wrapper.cwl

new file mode 100644 (file)

index 0000000..fda566c
--- /dev/null
+++ b/sdk/cwl/tests/collection_per_tool/collection_per_tool_wrapper.cwl
@@ -0,0 +1,35 @@
+# Copyright (C) The Arvados Authors. All rights reserved.
+#
+# SPDX-License-Identifier: Apache-2.0
+
+{
+    "$graph": [
+        {
+            "class": "Workflow",
+            "hints": [
+                {
+                    "acrContainerImage": "999999999999999999999999999999d3+99",
+                    "class": "http://arvados.org/cwl#WorkflowRunnerResources"
+                }
+            ],
+            "id": "#main",
+            "inputs": [],
+            "outputs": [],
+            "requirements": [
+                {
+                    "class": "SubworkflowFeatureRequirement"
+                }
+            ],
+            "steps": [
+                {
+                    "id": "#main/collection_per_tool.cwl",
+                    "in": [],
+                    "label": "collection_per_tool.cwl",
+                    "out": [],
+                    "run": "keep:92045991f69a417f2f26660db67911ef+61/workflow.json#main"
+                }
+            ]
+        }
+    ],
+    "cwlVersion": "v1.2"
+}
diff --git a/sdk/cwl/tests/test_container.py b/sdk/cwl/tests/test_container.py

index cb57b446da5877b4e74ef0b30ae7f930e37b0c12..75371e2b7856ffd36fdb51f8f7a69b4d89624d07 100644 (file)
--- a/sdk/cwl/tests/test_container.py
+++ b/sdk/cwl/tests/test_container.py
@@ -186,7 +186,7 @@ class TestContainer(unittest.TestCase):
                          'command': ['ls', '/var/spool/cwl'],
                          'cwd': '/var/spool/cwl',
                          'scheduling_parameters': {},
-                        'properties': {},
+                        'properties': {'cwl_input': {}},
                          'secret_mounts': {},
                          'output_storage_classes': ["default"]
                      }))
@@ -201,6 +201,7 @@ class TestContainer(unittest.TestCase):
          runner.intermediate_output_ttl = 3600
          runner.secret_store = cwltool.secrets.SecretStore()
          runner.api._rootDesc = {"revision": "20210628"}
+        runner.api.config.return_value = {"Containers": {"DefaultKeepCacheDisk": 0}}
  
          keepdocker.return_value = [("zzzzz-4zz18-zzzzzzzzzzzzzz3", "")]
          runner.api.collections().get().execute.return_value = {
@@ -277,7 +278,7 @@ class TestContainer(unittest.TestCase):
              'scheduling_parameters': {
                  'partitions': ['blurb']
              },
-            'properties': {},
+            'properties': {'cwl_input': {}},
              'secret_mounts': {},
              'output_storage_classes': ["default"]
          }
@@ -410,7 +411,7 @@ class TestContainer(unittest.TestCase):
              'cwd': '/var/spool/cwl',
              'scheduling_parameters': {
              },
-            'properties': {},
+            'properties': {'cwl_input': {}},
              'secret_mounts': {},
              'output_storage_classes': ["default"]
          }
@@ -497,7 +498,7 @@ class TestContainer(unittest.TestCase):
                      'command': ['ls', '/var/spool/cwl'],
                      'cwd': '/var/spool/cwl',
                      'scheduling_parameters': {},
-                    'properties': {},
+                    'properties': {'cwl_input': {}},
                      'secret_mounts': {},
                      'output_storage_classes': ["default"]
                  }))
@@ -534,6 +535,7 @@ class TestContainer(unittest.TestCase):
          arvjob.successCodes = [0]
          arvjob.outdir = "/var/spool/cwl"
          arvjob.output_ttl = 3600
+        arvjob.uuid = "zzzzz-xvhdp-zzzzzzzzzzzzzz1"
  
          arvjob.collect_outputs.return_value = {"out": "stuff"}
  
@@ -543,7 +545,8 @@ class TestContainer(unittest.TestCase):
              "output_uuid": "zzzzz-4zz18-zzzzzzzzzzzzzz2",
              "uuid": "zzzzz-xvhdp-zzzzzzzzzzzzzzz",
              "container_uuid": "zzzzz-8i9sb-zzzzzzzzzzzzzzz",
-            "modified_at": "2017-05-26T12:01:22Z"
+            "modified_at": "2017-05-26T12:01:22Z",
+            "properties": {}
          })
  
          self.assertFalse(api.collections().create.called)
@@ -553,6 +556,10 @@ class TestContainer(unittest.TestCase):
          arvjob.output_callback.assert_called_with({"out": "stuff"}, "success")
          runner.add_intermediate_output.assert_called_with("zzzzz-4zz18-zzzzzzzzzzzzzz2")
  
+        runner.api.container_requests().update.assert_called_with(uuid="zzzzz-xvhdp-zzzzzzzzzzzzzz1",
+                                                                  body={'container_request': {'properties': {'cwl_output': {'out': 'stuff'}}}})
+
+
      # Test to make sure we dont call runtime_status_update if we already did
      # some where higher up in the call stack
      @mock.patch("arvados_cwl.util.get_current_container")
@@ -636,7 +643,8 @@ class TestContainer(unittest.TestCase):
              "output_uuid": "zzzzz-4zz18-zzzzzzzzzzzzzz2",
              "uuid": "zzzzz-xvhdp-zzzzzzzzzzzzzzz",
              "container_uuid": "zzzzz-8i9sb-zzzzzzzzzzzzzzz",
-            "modified_at": "2017-05-26T12:01:22Z"
+            "modified_at": "2017-05-26T12:01:22Z",
+            "properties": {}
          })
  
          rts_mock.assert_called_with(
@@ -733,7 +741,38 @@ class TestContainer(unittest.TestCase):
                      'command': ['ls', '/var/spool/cwl'],
                      'cwd': '/var/spool/cwl',
                      'scheduling_parameters': {},
-                    'properties': {},
+                    'properties': {'cwl_input': {
+                        "p1": {
+                            "basename": "99999999999999999999999999999994+44",
+                            "class": "Directory",
+                            "dirname": "/keep",
+                            "http://arvados.org/cwl#collectionUUID": "zzzzz-4zz18-zzzzzzzzzzzzzzz",
+                            "listing": [
+                                {
+                                    "basename": "file1",
+                                    "class": "File",
+                                    "dirname": "/keep/99999999999999999999999999999994+44",
+                                    "location": "keep:99999999999999999999999999999994+44/file1",
+                                    "nameext": "",
+                                    "nameroot": "file1",
+                                    "path": "/keep/99999999999999999999999999999994+44/file1",
+                                    "size": 0
+                                },
+                                {
+                                    "basename": "file2",
+                                    "class": "File",
+                                    "dirname": "/keep/99999999999999999999999999999994+44",
+                                    "location": "keep:99999999999999999999999999999994+44/file2",
+                                    "nameext": "",
+                                    "nameroot": "file2",
+                                    "path": "/keep/99999999999999999999999999999994+44/file2",
+                                    "size": 0
+                                }
+                            ],
+                            "location": "keep:99999999999999999999999999999994+44",
+                            "path": "/keep/99999999999999999999999999999994+44"
+                        }
+                    }},
                      'secret_mounts': {},
                      'output_storage_classes': ["default"]
                  }))
@@ -827,7 +866,7 @@ class TestContainer(unittest.TestCase):
                      'command': ['md5sum', 'example.conf'],
                      'cwd': '/var/spool/cwl',
                      'scheduling_parameters': {},
-                    'properties': {},
+                    'properties': {'cwl_input': job_order},
                      "secret_mounts": {
                          "/var/spool/cwl/example.conf": {
                              "content": "username: user\npassword: blorp\n",
@@ -949,7 +988,7 @@ class TestContainer(unittest.TestCase):
                      'command': ['ls', '/var/spool/cwl'],
                      'cwd': '/var/spool/cwl',
                      'scheduling_parameters': {},
-                    'properties': {},
+                    'properties': {'cwl_input': {}},
                      'secret_mounts': {},
                      'output_storage_classes': ["foo_sc", "bar_sc"]
                  }))
@@ -1037,6 +1076,7 @@ class TestContainer(unittest.TestCase):
                      'scheduling_parameters': {},
                      'properties': {
                          "baz": "blorp",
+                        "cwl_input": {"x": "blorp"},
                          "foo": "bar",
                          "quux": {
                              "q1": 1,
@@ -1145,7 +1185,7 @@ class TestContainer(unittest.TestCase):
                          'command': ['nvidia-smi'],
                          'cwd': '/var/spool/cwl',
                          'scheduling_parameters': {},
-                        'properties': {},
+                        'properties': {'cwl_input': {}},
                          'secret_mounts': {},
                          'output_storage_classes': ["default"]
                      }))
@@ -1219,7 +1259,7 @@ class TestContainer(unittest.TestCase):
              'command': ['echo'],
              'cwd': '/var/spool/cwl',
              'scheduling_parameters': {},
-            'properties': {},
+            'properties': {'cwl_input': {}},
              'secret_mounts': {},
              'output_storage_classes': ["default"]
          }
@@ -1332,7 +1372,7 @@ class TestContainer(unittest.TestCase):
                              'command': ['ls', '/var/spool/cwl'],
                              'cwd': '/var/spool/cwl',
                              'scheduling_parameters': sched,
-                            'properties': {},
+                            'properties': {'cwl_input': {}},
                              'secret_mounts': {},
                              'output_storage_classes': ["default"]
                          }))
@@ -1521,7 +1561,19 @@ class TestWorkflow(unittest.TestCase):
                  "output_path": "/var/spool/cwl",
                  "output_ttl": 0,
                  "priority": 500,
-                "properties": {},
+                "properties": {'cwl_input': {
+                        "fileblub": {
+                            "basename": "token.txt",
+                            "class": "File",
+                            "dirname": "/keep/99999999999999999999999999999999+118",
+                            "location": "keep:99999999999999999999999999999999+118/token.txt",
+                            "nameext": ".txt",
+                            "nameroot": "token",
+                            "path": "/keep/99999999999999999999999999999999+118/token.txt",
+                            "size": 0
+                        },
+                        "sleeptime": 5
+                }},
                  "runtime_constraints": {
                      "ram": 1073741824,
                      "vcpus": 1
@@ -1594,7 +1646,7 @@ class TestWorkflow(unittest.TestCase):
                  'name': u'echo-subwf',
                  'secret_mounts': {},
                  'runtime_constraints': {'API': True, 'vcpus': 3, 'ram': 1073741824},
-                'properties': {},
+                'properties': {'cwl_input': {}},
                  'priority': 500,
                  'mounts': {
                      '/var/spool/cwl/cwl.input.yml': {
diff --git a/sdk/cwl/tests/test_http.py b/sdk/cwl/tests/test_http.py

index 650b5f0598514bbe9fd5ea0de96ab848d2375ad0..5598b1f1387a33a4c53d45eac5fe7dbc042dbeef 100644 (file)
--- a/sdk/cwl/tests/test_http.py
+++ b/sdk/cwl/tests/test_http.py
@@ -58,7 +58,7 @@ class TestHttpToKeep(unittest.TestCase):
          r = arvados_cwl.http.http_to_keep(api, None, "http://example.com/file1.txt", utcnow=utcnow)
          self.assertEqual(r, "keep:99999999999999999999999999999998+99/file1.txt")
  
-        getmock.assert_called_with("http://example.com/file1.txt", stream=True, allow_redirects=True)
+        getmock.assert_called_with("http://example.com/file1.txt", stream=True, allow_redirects=True, headers={})
  
          cm.open.assert_called_with("file1.txt", "wb")
          cm.save_new.assert_called_with(name="Downloaded from http%3A%2F%2Fexample.com%2Ffile1.txt",
@@ -186,7 +186,7 @@ class TestHttpToKeep(unittest.TestCase):
          r = arvados_cwl.http.http_to_keep(api, None, "http://example.com/file1.txt", utcnow=utcnow)
          self.assertEqual(r, "keep:99999999999999999999999999999997+99/file1.txt")
  
-        getmock.assert_called_with("http://example.com/file1.txt", stream=True, allow_redirects=True)
+        getmock.assert_called_with("http://example.com/file1.txt", stream=True, allow_redirects=True, headers={})
  
          cm.open.assert_called_with("file1.txt", "wb")
          cm.save_new.assert_called_with(name="Downloaded from http%3A%2F%2Fexample.com%2Ffile1.txt",
@@ -212,7 +212,7 @@ class TestHttpToKeep(unittest.TestCase):
                      'http://example.com/file1.txt': {
                          'Date': 'Tue, 15 May 2018 00:00:00 GMT',
                          'Expires': 'Tue, 16 May 2018 00:00:00 GMT',
-                        'ETag': '123456'
+                        'ETag': '"123456"'
                      }
                  }
              }]
@@ -229,7 +229,7 @@ class TestHttpToKeep(unittest.TestCase):
          req.headers = {
              'Date': 'Tue, 17 May 2018 00:00:00 GMT',
              'Expires': 'Tue, 19 May 2018 00:00:00 GMT',
-            'ETag': '123456'
+            'ETag': '"123456"'
          }
          headmock.return_value = req
  
@@ -247,7 +247,7 @@ class TestHttpToKeep(unittest.TestCase):
                        body={"collection":{"properties": {'http://example.com/file1.txt': {
                            'Date': 'Tue, 17 May 2018 00:00:00 GMT',
                            'Expires': 'Tue, 19 May 2018 00:00:00 GMT',
-                          'ETag': '123456'
+                          'ETag': '"123456"'
                        }}}})
                        ])
  
@@ -277,7 +277,7 @@ class TestHttpToKeep(unittest.TestCase):
          r = arvados_cwl.http.http_to_keep(api, None, "http://example.com/download?fn=/file1.txt", utcnow=utcnow)
          self.assertEqual(r, "keep:99999999999999999999999999999998+99/file1.txt")
  
-        getmock.assert_called_with("http://example.com/download?fn=/file1.txt", stream=True, allow_redirects=True)
+        getmock.assert_called_with("http://example.com/download?fn=/file1.txt", stream=True, allow_redirects=True, headers={})
  
          cm.open.assert_called_with("file1.txt", "wb")
          cm.save_new.assert_called_with(name="Downloaded from http%3A%2F%2Fexample.com%2Fdownload%3Ffn%3D%2Ffile1.txt",
@@ -287,3 +287,156 @@ class TestHttpToKeep(unittest.TestCase):
              mock.call(uuid=cm.manifest_locator(),
                        body={"collection":{"properties": {"http://example.com/download?fn=/file1.txt": {'Date': 'Tue, 15 May 2018 00:00:00 GMT'}}}})
          ])
+
+    @mock.patch("requests.get")
+    @mock.patch("requests.head")
+    @mock.patch("arvados.collection.CollectionReader")
+    def test_http_etag_if_none_match(self, collectionmock, headmock, getmock):
+        api = mock.MagicMock()
+
+        api.collections().list().execute.return_value = {
+            "items": [{
+                "uuid": "zzzzz-4zz18-zzzzzzzzzzzzzz3",
+                "portable_data_hash": "99999999999999999999999999999998+99",
+                "properties": {
+                    'http://example.com/file1.txt': {
+                        'Date': 'Tue, 15 May 2018 00:00:00 GMT',
+                        'Expires': 'Tue, 16 May 2018 00:00:00 GMT',
+                        'ETag': '"123456"'
+                    }
+                }
+            }]
+        }
+
+        cm = mock.MagicMock()
+        cm.manifest_locator.return_value = "zzzzz-4zz18-zzzzzzzzzzzzzz3"
+        cm.portable_data_hash.return_value = "99999999999999999999999999999998+99"
+        cm.keys.return_value = ["file1.txt"]
+        collectionmock.return_value = cm
+
+        # Head request fails, will try a conditional GET instead
+        req = mock.MagicMock()
+        req.status_code = 403
+        req.headers = {
+        }
+        headmock.return_value = req
+
+        utcnow = mock.MagicMock()
+        utcnow.return_value = datetime.datetime(2018, 5, 17)
+
+        req = mock.MagicMock()
+        req.status_code = 304
+        req.headers = {
+            'Date': 'Tue, 17 May 2018 00:00:00 GMT',
+            'Expires': 'Tue, 19 May 2018 00:00:00 GMT',
+            'ETag': '"123456"'
+        }
+        getmock.return_value = req
+
+        r = arvados_cwl.http.http_to_keep(api, None, "http://example.com/file1.txt", utcnow=utcnow)
+        self.assertEqual(r, "keep:99999999999999999999999999999998+99/file1.txt")
+
+        getmock.assert_called_with("http://example.com/file1.txt", stream=True, allow_redirects=True, headers={"If-None-Match": '"123456"'})
+        cm.open.assert_not_called()
+
+        api.collections().update.assert_has_calls([
+            mock.call(uuid=cm.manifest_locator(),
+                      body={"collection":{"properties": {'http://example.com/file1.txt': {
+                          'Date': 'Tue, 17 May 2018 00:00:00 GMT',
+                          'Expires': 'Tue, 19 May 2018 00:00:00 GMT',
+                          'ETag': '"123456"'
+                      }}}})
+                      ])
+
+
+    @mock.patch("requests.get")
+    @mock.patch("requests.head")
+    @mock.patch("arvados.collection.CollectionReader")
+    def test_http_prefer_cached_downloads(self, collectionmock, headmock, getmock):
+        api = mock.MagicMock()
+
+        api.collections().list().execute.return_value = {
+            "items": [{
+                "uuid": "zzzzz-4zz18-zzzzzzzzzzzzzz3",
+                "portable_data_hash": "99999999999999999999999999999998+99",
+                "properties": {
+                    'http://example.com/file1.txt': {
+                        'Date': 'Tue, 15 May 2018 00:00:00 GMT',
+                        'Expires': 'Tue, 16 May 2018 00:00:00 GMT',
+                        'ETag': '"123456"'
+                    }
+                }
+            }]
+        }
+
+        cm = mock.MagicMock()
+        cm.manifest_locator.return_value = "zzzzz-4zz18-zzzzzzzzzzzzzz3"
+        cm.portable_data_hash.return_value = "99999999999999999999999999999998+99"
+        cm.keys.return_value = ["file1.txt"]
+        collectionmock.return_value = cm
+
+        utcnow = mock.MagicMock()
+        utcnow.return_value = datetime.datetime(2018, 5, 17)
+
+        r = arvados_cwl.http.http_to_keep(api, None, "http://example.com/file1.txt", utcnow=utcnow, prefer_cached_downloads=True)
+        self.assertEqual(r, "keep:99999999999999999999999999999998+99/file1.txt")
+
+        headmock.assert_not_called()
+        getmock.assert_not_called()
+        cm.open.assert_not_called()
+        api.collections().update.assert_not_called()
+
+    @mock.patch("requests.get")
+    @mock.patch("requests.head")
+    @mock.patch("arvados.collection.CollectionReader")
+    def test_http_varying_url_params(self, collectionmock, headmock, getmock):
+        for prurl in ("http://example.com/file1.txt", "http://example.com/file1.txt?KeyId=123&Signature=456&Expires=789"):
+            api = mock.MagicMock()
+
+            api.collections().list().execute.return_value = {
+                "items": [{
+                    "uuid": "zzzzz-4zz18-zzzzzzzzzzzzzz3",
+                    "portable_data_hash": "99999999999999999999999999999998+99",
+                    "properties": {
+                        prurl: {
+                            'Date': 'Tue, 15 May 2018 00:00:00 GMT',
+                            'Expires': 'Tue, 16 May 2018 00:00:00 GMT',
+                            'ETag': '"123456"'
+                        }
+                    }
+                }]
+            }
+
+            cm = mock.MagicMock()
+            cm.manifest_locator.return_value = "zzzzz-4zz18-zzzzzzzzzzzzzz3"
+            cm.portable_data_hash.return_value = "99999999999999999999999999999998+99"
+            cm.keys.return_value = ["file1.txt"]
+            collectionmock.return_value = cm
+
+            req = mock.MagicMock()
+            req.status_code = 200
+            req.headers = {
+                'Date': 'Tue, 17 May 2018 00:00:00 GMT',
+                'Expires': 'Tue, 19 May 2018 00:00:00 GMT',
+                'ETag': '"123456"'
+            }
+            headmock.return_value = req
+
+            utcnow = mock.MagicMock()
+            utcnow.return_value = datetime.datetime(2018, 5, 17)
+
+            r = arvados_cwl.http.http_to_keep(api, None, "http://example.com/file1.txt?KeyId=123&Signature=456&Expires=789",
+                                              utcnow=utcnow, varying_url_params="KeyId,Signature,Expires")
+            self.assertEqual(r, "keep:99999999999999999999999999999998+99/file1.txt")
+
+            getmock.assert_not_called()
+            cm.open.assert_not_called()
+
+            api.collections().update.assert_has_calls([
+                mock.call(uuid=cm.manifest_locator(),
+                          body={"collection":{"properties": {'http://example.com/file1.txt': {
+                              'Date': 'Tue, 17 May 2018 00:00:00 GMT',
+                              'Expires': 'Tue, 19 May 2018 00:00:00 GMT',
+                              'ETag': '"123456"'
+                          }}}})
+                          ])
diff --git a/sdk/cwl/tests/test_submit.py b/sdk/cwl/tests/test_submit.py

index b44f6feb5d28db91d38bcc25105c5b2adc513b95..dcbee726b6ce4962692d8255d7be2b41b76c5f09 100644 (file)
--- a/sdk/cwl/tests/test_submit.py
+++ b/sdk/cwl/tests/test_submit.py
@@ -290,13 +290,13 @@ def stubs(wfdetails=('submit_wf.cwl', None)):
              gitinfo_workflow["$graph"][0]["id"] = "file://%s/tests/wf/%s" % (cwd, wfpath)
              mocktool = mock.NonCallableMock(tool=gitinfo_workflow["$graph"][0], metadata=gitinfo_workflow)
  
-            git_info = arvados_cwl.executor.ArvCwlExecutor.get_git_info(mocktool)
-            expect_packed_workflow.update(git_info)
+            stubs.git_info = arvados_cwl.executor.ArvCwlExecutor.get_git_info(mocktool)
+            expect_packed_workflow.update(stubs.git_info)
  
-            git_props = {"arv:"+k.split("#", 1)[1]: v for k,v in git_info.items()}
+            stubs.git_props = {"arv:"+k.split("#", 1)[1]: v for k,v in stubs.git_info.items()}
  
              if wfname == wfpath:
-                container_name = "%s (%s)" % (wfpath, git_props["arv:gitDescribe"])
+                container_name = "%s (%s)" % (wfpath, stubs.git_props["arv:gitDescribe"])
              else:
                  container_name = wfname
  
@@ -359,7 +359,7 @@ def stubs(wfdetails=('submit_wf.cwl', None)):
                      'ram': (1024+256)*1024*1024
                  },
                  'use_existing': False,
-                'properties': git_props,
+                'properties': stubs.git_props,
                  'secret_mounts': {}
              }
  
@@ -393,7 +393,7 @@ class TestSubmit(unittest.TestCase):
          root_logger.handlers = handlers
  
      @mock.patch("time.sleep")
-    @stubs
+    @stubs()
      def test_submit_invalid_runner_ram(self, stubs, tm):
          exited = arvados_cwl.main(
              ["--submit", "--no-wait", "--debug", "--submit-runner-ram=-2048",
@@ -402,7 +402,7 @@ class TestSubmit(unittest.TestCase):
          self.assertEqual(exited, 1)
  
  
-    @stubs
+    @stubs()
      def test_submit_container(self, stubs):
          exited = arvados_cwl.main(
              ["--submit", "--no-wait", "--api=containers", "--debug",
@@ -414,7 +414,7 @@ class TestSubmit(unittest.TestCase):
                  'manifest_text':
                  '. 979af1245a12a1fed634d4222473bfdc+16 0:16:blorp.txt\n',
                  'replication_desired': None,
-                'name': 'submit_wf.cwl input (169f39d466a5438ac4a90e779bf750c7+53)',
+                'name': 'submit_wf.cwl ('+ stubs.git_props["arv:gitDescribe"] +') input (169f39d466a5438ac4a90e779bf750c7+53)',
              }), ensure_unique_name=False),
              mock.call(body=JsonDiffMatcher({
                  'manifest_text':
@@ -432,7 +432,7 @@ class TestSubmit(unittest.TestCase):
          self.assertEqual(exited, 0)
  
  
-    @stubs
+    @stubs()
      def test_submit_container_tool(self, stubs):
          # test for issue #16139
          exited = arvados_cwl.main(
@@ -444,7 +444,7 @@ class TestSubmit(unittest.TestCase):
                           stubs.expect_container_request_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_container_no_reuse(self, stubs):
          exited = arvados_cwl.main(
              ["--submit", "--no-wait", "--api=containers", "--debug", "--disable-reuse",
@@ -457,7 +457,7 @@ class TestSubmit(unittest.TestCase):
              '--no-log-timestamps', '--disable-validate', '--disable-color',
              '--eval-timeout=20', '--thread-count=0',
              '--disable-reuse', "--collection-cache-size=256",
-            "--output-name=Output from workflow submit_wf.cwl",
+            '--output-name=Output from workflow submit_wf.cwl (%s)' % stubs.git_props["arv:gitDescribe"],
              '--debug', '--on-error=continue',
              '/var/lib/cwl/workflow.json#main', '/var/lib/cwl/cwl.input.json']
          expect_container["use_existing"] = False
@@ -496,7 +496,7 @@ class TestSubmit(unittest.TestCase):
                           stubs.expect_container_request_uuid + '\n')
  
  
-    @stubs
+    @stubs()
      def test_submit_container_on_error(self, stubs):
          exited = arvados_cwl.main(
              ["--submit", "--no-wait", "--api=containers", "--debug", "--on-error=stop",
@@ -508,7 +508,7 @@ class TestSubmit(unittest.TestCase):
                                         '--no-log-timestamps', '--disable-validate', '--disable-color',
                                         '--eval-timeout=20', '--thread-count=0',
                                         '--enable-reuse', "--collection-cache-size=256",
-                                       "--output-name=Output from workflow submit_wf.cwl",
+                                       '--output-name=Output from workflow submit_wf.cwl (%s)' % stubs.git_props["arv:gitDescribe"],
                                         '--debug', '--on-error=stop',
                                         '/var/lib/cwl/workflow.json#main', '/var/lib/cwl/cwl.input.json']
  
@@ -518,7 +518,7 @@ class TestSubmit(unittest.TestCase):
                           stubs.expect_container_request_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_container_output_name(self, stubs):
          output_name = "test_output_name"
  
@@ -542,7 +542,7 @@ class TestSubmit(unittest.TestCase):
                           stubs.expect_container_request_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_storage_classes(self, stubs):
          exited = arvados_cwl.main(
              ["--debug", "--submit", "--no-wait", "--api=containers", "--storage-classes=foo",
@@ -554,7 +554,7 @@ class TestSubmit(unittest.TestCase):
                                         '--no-log-timestamps', '--disable-validate', '--disable-color',
                                         '--eval-timeout=20', '--thread-count=0',
                                         '--enable-reuse', "--collection-cache-size=256",
-                                       '--output-name=Output from workflow submit_wf.cwl',
+                                       '--output-name=Output from workflow submit_wf.cwl (%s)' % stubs.git_props["arv:gitDescribe"],
                                         "--debug",
                                         "--storage-classes=foo", '--on-error=continue',
                                         '/var/lib/cwl/workflow.json#main', '/var/lib/cwl/cwl.input.json']
@@ -565,7 +565,7 @@ class TestSubmit(unittest.TestCase):
                           stubs.expect_container_request_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_multiple_storage_classes(self, stubs):
          exited = arvados_cwl.main(
              ["--debug", "--submit", "--no-wait", "--api=containers", "--storage-classes=foo,bar", "--intermediate-storage-classes=baz",
@@ -577,7 +577,7 @@ class TestSubmit(unittest.TestCase):
                                         '--no-log-timestamps', '--disable-validate', '--disable-color',
                                         '--eval-timeout=20', '--thread-count=0',
                                         '--enable-reuse', "--collection-cache-size=256",
-                                       "--output-name=Output from workflow submit_wf.cwl",
+                                       '--output-name=Output from workflow submit_wf.cwl (%s)' % stubs.git_props["arv:gitDescribe"],
                                         "--debug",
                                         "--storage-classes=foo,bar", "--intermediate-storage-classes=baz", '--on-error=continue',
                                         '/var/lib/cwl/workflow.json#main', '/var/lib/cwl/cwl.input.json']
@@ -591,7 +591,7 @@ class TestSubmit(unittest.TestCase):
      @mock.patch("cwltool.task_queue.TaskQueue")
      @mock.patch("arvados_cwl.arvworkflow.ArvadosWorkflow.job")
      @mock.patch("arvados_cwl.executor.ArvCwlExecutor.make_output_collection")
-    @stubs
+    @stubs()
      def test_storage_classes_correctly_propagate_to_make_output_collection(self, stubs, make_output, job, tq):
          final_output_c = arvados.collection.Collection()
          make_output.return_value = ({},final_output_c)
@@ -602,17 +602,17 @@ class TestSubmit(unittest.TestCase):
          job.side_effect = set_final_output
  
          exited = arvados_cwl.main(
-            ["--debug", "--local", "--storage-classes=foo",
+            ["--debug", "--local", "--storage-classes=foo", "--disable-git",
                  "tests/wf/submit_wf.cwl", "tests/submit_test_job.json"],
              stubs.capture_stdout, sys.stderr, api_client=stubs.api, keep_client=stubs.keep_client)
  
-        make_output.assert_called_with(u'Output of submit_wf.cwl', ['foo'], '', {}, {"out": "zzzzz"})
+        make_output.assert_called_with(u'Output from workflow submit_wf.cwl', ['foo'], '', {}, {"out": "zzzzz"})
          self.assertEqual(exited, 0)
  
      @mock.patch("cwltool.task_queue.TaskQueue")
      @mock.patch("arvados_cwl.arvworkflow.ArvadosWorkflow.job")
      @mock.patch("arvados_cwl.executor.ArvCwlExecutor.make_output_collection")
-    @stubs
+    @stubs()
      def test_default_storage_classes_correctly_propagate_to_make_output_collection(self, stubs, make_output, job, tq):
          final_output_c = arvados.collection.Collection()
          make_output.return_value = ({},final_output_c)
@@ -624,17 +624,17 @@ class TestSubmit(unittest.TestCase):
          job.side_effect = set_final_output
  
          exited = arvados_cwl.main(
-            ["--debug", "--local",
+            ["--debug", "--local", "--disable-git",
                  "tests/wf/submit_wf.cwl", "tests/submit_test_job.json"],
              stubs.capture_stdout, sys.stderr, api_client=stubs.api, keep_client=stubs.keep_client)
  
-        make_output.assert_called_with(u'Output of submit_wf.cwl', ['default'], '', {}, {"out": "zzzzz"})
+        make_output.assert_called_with(u'Output from workflow submit_wf.cwl', ['default'], '', {}, {"out": "zzzzz"})
          self.assertEqual(exited, 0)
  
      @mock.patch("cwltool.task_queue.TaskQueue")
      @mock.patch("arvados_cwl.arvworkflow.ArvadosWorkflow.job")
      @mock.patch("arvados_cwl.executor.ArvCwlExecutor.make_output_collection")
-    @stubs
+    @stubs()
      def test_storage_class_hint_to_make_output_collection(self, stubs, make_output, job, tq):
          final_output_c = arvados.collection.Collection()
          make_output.return_value = ({},final_output_c)
@@ -645,14 +645,14 @@ class TestSubmit(unittest.TestCase):
          job.side_effect = set_final_output
  
          exited = arvados_cwl.main(
-            ["--debug", "--local",
+            ["--debug", "--local", "--disable-git",
                  "tests/wf/submit_storage_class_wf.cwl", "tests/submit_test_job.json"],
              stubs.capture_stdout, sys.stderr, api_client=stubs.api, keep_client=stubs.keep_client)
  
-        make_output.assert_called_with(u'Output of submit_storage_class_wf.cwl', ['foo', 'bar'], '', {}, {"out": "zzzzz"})
+        make_output.assert_called_with(u'Output from workflow submit_storage_class_wf.cwl', ['foo', 'bar'], '', {}, {"out": "zzzzz"})
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_container_output_ttl(self, stubs):
          exited = arvados_cwl.main(
              ["--submit", "--no-wait", "--api=containers", "--debug", "--intermediate-output-ttl", "3600",
@@ -664,7 +664,8 @@ class TestSubmit(unittest.TestCase):
                                         '--no-log-timestamps', '--disable-validate', '--disable-color',
                                         '--eval-timeout=20', '--thread-count=0',
                                         '--enable-reuse', "--collection-cache-size=256",
-                                       "--output-name=Output from workflow submit_wf.cwl", '--debug',
+                                       '--output-name=Output from workflow submit_wf.cwl (%s)' % stubs.git_props["arv:gitDescribe"],
+                                       '--debug',
                                         '--on-error=continue',
                                         "--intermediate-output-ttl=3600",
                                         '/var/lib/cwl/workflow.json#main', '/var/lib/cwl/cwl.input.json']
@@ -675,7 +676,7 @@ class TestSubmit(unittest.TestCase):
                           stubs.expect_container_request_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_container_trash_intermediate(self, stubs):
          exited = arvados_cwl.main(
              ["--submit", "--no-wait", "--api=containers", "--debug", "--trash-intermediate",
@@ -688,6 +689,7 @@ class TestSubmit(unittest.TestCase):
                                         '--no-log-timestamps', '--disable-validate', '--disable-color',
                                         '--eval-timeout=20', '--thread-count=0',
                                         '--enable-reuse', "--collection-cache-size=256",
+                                       '--output-name=Output from workflow submit_wf.cwl (%s)' % stubs.git_props["arv:gitDescribe"],
                                         '--debug', '--on-error=continue',
                                         "--trash-intermediate",
                                         '/var/lib/cwl/workflow.json#main', '/var/lib/cwl/cwl.input.json']
@@ -698,7 +700,7 @@ class TestSubmit(unittest.TestCase):
                           stubs.expect_container_request_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_container_output_tags(self, stubs):
          output_tags = "tag0,tag1,tag2"
  
@@ -712,7 +714,7 @@ class TestSubmit(unittest.TestCase):
                                         '--no-log-timestamps', '--disable-validate', '--disable-color',
                                         '--eval-timeout=20', '--thread-count=0',
                                         '--enable-reuse', "--collection-cache-size=256",
-                                       "--output-name=Output from workflow submit_wf.cwl",
+                                       '--output-name=Output from workflow submit_wf.cwl (%s)' % stubs.git_props["arv:gitDescribe"],
                                         "--output-tags="+output_tags, '--debug', '--on-error=continue',
                                         '/var/lib/cwl/workflow.json#main', '/var/lib/cwl/cwl.input.json']
  
@@ -722,7 +724,7 @@ class TestSubmit(unittest.TestCase):
                           stubs.expect_container_request_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_container_runner_ram(self, stubs):
          exited = arvados_cwl.main(
              ["--submit", "--no-wait", "--api=containers", "--debug", "--submit-runner-ram=2048",
@@ -740,7 +742,7 @@ class TestSubmit(unittest.TestCase):
  
      @mock.patch("arvados.collection.CollectionReader")
      @mock.patch("time.sleep")
-    @stubs
+    @stubs()
      def test_submit_file_keepref(self, stubs, tm, collectionReader):
          collectionReader().exists.return_value = True
          collectionReader().find.return_value = arvados.arvfile.ArvadosFile(mock.MagicMock(), "blorp.txt")
@@ -752,7 +754,7 @@ class TestSubmit(unittest.TestCase):
  
      @mock.patch("arvados.collection.CollectionReader")
      @mock.patch("time.sleep")
-    @stubs
+    @stubs()
      def test_submit_keepref(self, stubs, tm, reader):
          with open("tests/wf/expect_arvworkflow.cwl") as f:
              reader().open().__enter__().read.return_value = f.read()
@@ -813,13 +815,13 @@ class TestSubmit(unittest.TestCase):
          self.assertEqual(exited, 0)
  
      @mock.patch("time.sleep")
-    @stubs
+    @stubs()
      def test_submit_arvworkflow(self, stubs, tm):
          with open("tests/wf/expect_arvworkflow.cwl") as f:
              stubs.api.workflows().get().execute.return_value = {"definition": f.read(), "name": "a test workflow"}
  
          exited = arvados_cwl.main(
-            ["--submit", "--no-wait", "--api=containers", "--debug",
+            ["--submit", "--no-wait", "--api=containers", "--debug", "--disable-git",
               "962eh-7fd4e-gkbzl62qqtfig37", "-x", "XxX"],
              stubs.capture_stdout, sys.stderr, api_client=stubs.api)
  
@@ -863,8 +865,7 @@ class TestSubmit(unittest.TestCase):
                                  'requirements': [
                                      {
                                          'dockerPull': 'debian:buster-slim',
-                                        'class': 'DockerRequirement',
-                                        "http://arvados.org/cwl#dockerCollectionPDH": "999999999999999999999999999999d4+99"
+                                        'class': 'DockerRequirement'
                                      }
                                  ],
                                  'id': '#submit_tool.cwl',
@@ -888,8 +889,11 @@ class TestSubmit(unittest.TestCase):
              'command': ['arvados-cwl-runner', '--local', '--api=containers',
                          '--no-log-timestamps', '--disable-validate', '--disable-color',
                          '--eval-timeout=20', '--thread-count=0',
-                        '--enable-reuse', "--collection-cache-size=256", '--debug', '--on-error=continue',
+                        '--enable-reuse', "--collection-cache-size=256",
+                        "--output-name=Output from workflow a test workflow",
+                        '--debug', '--on-error=continue',
                          '/var/lib/cwl/workflow.json#main', '/var/lib/cwl/cwl.input.json'],
+            'output_name': 'Output from workflow a test workflow',
              'cwd': '/var/spool/cwl',
              'runtime_constraints': {
                  'API': True,
@@ -924,7 +928,7 @@ class TestSubmit(unittest.TestCase):
                           stubs.expect_container_request_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_missing_input(self, stubs):
          exited = arvados_cwl.main(
              ["--submit", "--no-wait", "--api=containers", "--debug",
@@ -938,7 +942,7 @@ class TestSubmit(unittest.TestCase):
              stubs.capture_stdout, sys.stderr, api_client=stubs.api, keep_client=stubs.keep_client)
          self.assertEqual(exited, 1)
  
-    @stubs
+    @stubs()
      def test_submit_container_project(self, stubs):
          project_uuid = 'zzzzz-j7d0g-zzzzzzzzzzzzzzz'
          stubs.api.groups().get().execute.return_value = {"group_class": "project"}
@@ -953,7 +957,8 @@ class TestSubmit(unittest.TestCase):
                                         '--no-log-timestamps', '--disable-validate', '--disable-color',
                                         "--eval-timeout=20", "--thread-count=0",
                                         '--enable-reuse', "--collection-cache-size=256",
-                                       "--output-name=Output from workflow submit_wf.cwl", '--debug',
+                                       '--output-name=Output from workflow submit_wf.cwl (%s)' % stubs.git_props["arv:gitDescribe"],
+                                       '--debug',
                                         '--on-error=continue',
                                         '--project-uuid='+project_uuid,
                                         '/var/lib/cwl/workflow.json#main', '/var/lib/cwl/cwl.input.json']
@@ -964,7 +969,7 @@ class TestSubmit(unittest.TestCase):
                           stubs.expect_container_request_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_container_eval_timeout(self, stubs):
          exited = arvados_cwl.main(
              ["--submit", "--no-wait", "--api=containers", "--debug", "--eval-timeout=60",
@@ -976,6 +981,7 @@ class TestSubmit(unittest.TestCase):
                                         '--no-log-timestamps', '--disable-validate', '--disable-color',
                                         '--eval-timeout=60.0', '--thread-count=0',
                                         '--enable-reuse', "--collection-cache-size=256",
+                                       '--output-name=Output from workflow submit_wf.cwl (%s)' % stubs.git_props["arv:gitDescribe"],
                                         '--debug', '--on-error=continue',
                                         '/var/lib/cwl/workflow.json#main', '/var/lib/cwl/cwl.input.json']
  
@@ -985,7 +991,7 @@ class TestSubmit(unittest.TestCase):
                           stubs.expect_container_request_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_container_collection_cache(self, stubs):
          exited = arvados_cwl.main(
              ["--submit", "--no-wait", "--api=containers", "--debug", "--collection-cache-size=500",
@@ -997,6 +1003,7 @@ class TestSubmit(unittest.TestCase):
                                         '--no-log-timestamps', '--disable-validate', '--disable-color',
                                         '--eval-timeout=20', '--thread-count=0',
                                         '--enable-reuse', "--collection-cache-size=500",
+                                       '--output-name=Output from workflow submit_wf.cwl (%s)' % stubs.git_props["arv:gitDescribe"],
                                         '--debug', '--on-error=continue',
                                         '/var/lib/cwl/workflow.json#main', '/var/lib/cwl/cwl.input.json']
          expect_container["runtime_constraints"]["ram"] = (1024+500)*1024*1024
@@ -1007,7 +1014,7 @@ class TestSubmit(unittest.TestCase):
                           stubs.expect_container_request_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_container_thread_count(self, stubs):
          exited = arvados_cwl.main(
              ["--submit", "--no-wait", "--api=containers", "--debug", "--thread-count=20",
@@ -1019,6 +1026,7 @@ class TestSubmit(unittest.TestCase):
                                         '--no-log-timestamps', '--disable-validate', '--disable-color',
                                         '--eval-timeout=20', '--thread-count=20',
                                         '--enable-reuse', "--collection-cache-size=256",
+                                       '--output-name=Output from workflow submit_wf.cwl (%s)' % stubs.git_props["arv:gitDescribe"],
                                         '--debug', '--on-error=continue',
                                         '/var/lib/cwl/workflow.json#main', '/var/lib/cwl/cwl.input.json']
  
@@ -1028,7 +1036,7 @@ class TestSubmit(unittest.TestCase):
                           stubs.expect_container_request_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_container_runner_image(self, stubs):
          exited = arvados_cwl.main(
              ["--submit", "--no-wait", "--api=containers", "--debug", "--submit-runner-image=arvados/jobs:123",
@@ -1044,7 +1052,7 @@ class TestSubmit(unittest.TestCase):
                           stubs.expect_container_request_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_priority(self, stubs):
          exited = arvados_cwl.main(
              ["--submit", "--no-wait", "--api=containers", "--debug", "--priority=669",
@@ -1148,13 +1156,16 @@ class TestSubmit(unittest.TestCase):
                           arvados_cwl.runner.arvados_jobs_image(arvrunner, "arvados/jobs:"+arvados_cwl.__version__, arvrunner.runtimeContext))
  
  
-    @stubs
+    @stubs()
      def test_submit_secrets(self, stubs):
          exited = arvados_cwl.main(
              ["--submit", "--no-wait", "--api=containers", "--debug",
                  "tests/wf/secret_wf.cwl", "tests/secret_test_job.yml"],
              stubs.capture_stdout, sys.stderr, api_client=stubs.api, keep_client=stubs.keep_client)
  
+        stubs.git_props["arv:gitPath"] = "sdk/cwl/tests/wf/secret_wf.cwl"
+        stubs.git_info["http://arvados.org/cwl#gitPath"] = "sdk/cwl/tests/wf/secret_wf.cwl"
+
          expect_container = {
              "command": [
                  "arvados-cwl-runner",
@@ -1167,8 +1178,8 @@ class TestSubmit(unittest.TestCase):
                  '--thread-count=0',
                  "--enable-reuse",
                  "--collection-cache-size=256",
-                '--output-name=Output from workflow secret_wf.cwl'
-                '--debug',
+                '--output-name=Output from workflow secret_wf.cwl (%s)' % stubs.git_props["arv:gitDescribe"],
+                "--debug",
                  "--on-error=continue",
                  "/var/lib/cwl/workflow.json#main",
                  "/var/lib/cwl/cwl.input.json"
@@ -1292,11 +1303,11 @@ class TestSubmit(unittest.TestCase):
                      "path": "/var/spool/cwl/cwl.output.json"
                  }
              },
-            "name": "secret_wf.cwl",
-            "output_name": "Output from workflow secret_wf.cwl",
+            "name": "secret_wf.cwl (%s)" % stubs.git_props["arv:gitDescribe"],
+            "output_name": "Output from workflow secret_wf.cwl (%s)" % stubs.git_props["arv:gitDescribe"],
              "output_path": "/var/spool/cwl",
              "priority": 500,
-            "properties": {},
+            "properties": stubs.git_props,
              "runtime_constraints": {
                  "API": True,
                  "ram": 1342177280,
@@ -1312,13 +1323,15 @@ class TestSubmit(unittest.TestCase):
              "use_existing": False
          }
  
+        expect_container["mounts"]["/var/lib/cwl/workflow.json"]["content"].update(stubs.git_info)
+
          stubs.api.container_requests().create.assert_called_with(
              body=JsonDiffMatcher(expect_container))
          self.assertEqual(stubs.capture_stdout.getvalue(),
                           stubs.expect_container_request_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_request_uuid(self, stubs):
          stubs.api._rootDesc["remoteHosts"]["zzzzz"] = "123"
          stubs.expect_container_request_uuid = "zzzzz-xvhdp-yyyyyyyyyyyyyyy"
@@ -1340,7 +1353,7 @@ class TestSubmit(unittest.TestCase):
                           stubs.expect_container_request_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_container_cluster_id(self, stubs):
          stubs.api._rootDesc["remoteHosts"]["zbbbb"] = "123"
  
@@ -1357,7 +1370,7 @@ class TestSubmit(unittest.TestCase):
                           stubs.expect_container_request_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_validate_cluster_id(self, stubs):
          stubs.api._rootDesc["remoteHosts"]["zbbbb"] = "123"
          exited = arvados_cwl.main(
@@ -1366,7 +1379,7 @@ class TestSubmit(unittest.TestCase):
              stubs.capture_stdout, sys.stderr, api_client=stubs.api, keep_client=stubs.keep_client)
          self.assertEqual(exited, 1)
  
-    @stubs
+    @stubs()
      def test_submit_validate_project_uuid(self, stubs):
          # Fails with bad cluster prefix
          exited = arvados_cwl.main(
@@ -1392,7 +1405,7 @@ class TestSubmit(unittest.TestCase):
  
  
      @mock.patch("arvados.collection.CollectionReader")
-    @stubs
+    @stubs()
      def test_submit_uuid_inputs(self, stubs, collectionReader):
          collectionReader().exists.return_value = True
          collectionReader().find.return_value = arvados.arvfile.ArvadosFile(mock.MagicMock(), "file1.txt")
@@ -1427,7 +1440,7 @@ class TestSubmit(unittest.TestCase):
                           stubs.expect_container_request_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_mismatched_uuid_inputs(self, stubs):
          def list_side_effect(**kwargs):
              m = mock.MagicMock()
@@ -1460,7 +1473,7 @@ class TestSubmit(unittest.TestCase):
                  cwltool_logger.removeHandler(stderr_logger)
  
      @mock.patch("arvados.collection.CollectionReader")
-    @stubs
+    @stubs()
      def test_submit_unknown_uuid_inputs(self, stubs, collectionReader):
          collectionReader().find.return_value = arvados.arvfile.ArvadosFile(mock.MagicMock(), "file1.txt")
          capture_stderr = StringIO()
@@ -1528,7 +1541,7 @@ class TestSubmit(unittest.TestCase):
          self.assertEqual(exited, 0)
  
  
-    @stubs
+    @stubs()
      def test_submit_enable_preemptible(self, stubs):
          exited = arvados_cwl.main(
              ["--submit", "--no-wait", "--api=containers", "--debug", "--enable-preemptible",
@@ -1537,11 +1550,13 @@ class TestSubmit(unittest.TestCase):
  
          expect_container = copy.deepcopy(stubs.expect_container_spec)
          expect_container['command'] = ['arvados-cwl-runner', '--local', '--api=containers',
-                        '--no-log-timestamps', '--disable-validate', '--disable-color',
-                        '--eval-timeout=20', '--thread-count=0',
-                        '--enable-reuse', "--collection-cache-size=256", '--debug', '--on-error=continue',
+                                       '--no-log-timestamps', '--disable-validate', '--disable-color',
+                                       '--eval-timeout=20', '--thread-count=0',
+                                       '--enable-reuse', "--collection-cache-size=256",
+                                       '--output-name=Output from workflow submit_wf.cwl (%s)' % stubs.git_props["arv:gitDescribe"],
+                                       '--debug', '--on-error=continue',
                                         '--enable-preemptible',
-                        '/var/lib/cwl/workflow.json#main', '/var/lib/cwl/cwl.input.json']
+                                       '/var/lib/cwl/workflow.json#main', '/var/lib/cwl/cwl.input.json']
  
          stubs.api.container_requests().create.assert_called_with(
              body=JsonDiffMatcher(expect_container))
@@ -1549,7 +1564,7 @@ class TestSubmit(unittest.TestCase):
                           stubs.expect_container_request_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_submit_disable_preemptible(self, stubs):
          exited = arvados_cwl.main(
              ["--submit", "--no-wait", "--api=containers", "--debug", "--disable-preemptible",
@@ -1558,11 +1573,57 @@ class TestSubmit(unittest.TestCase):
  
          expect_container = copy.deepcopy(stubs.expect_container_spec)
          expect_container['command'] = ['arvados-cwl-runner', '--local', '--api=containers',
-                        '--no-log-timestamps', '--disable-validate', '--disable-color',
-                        '--eval-timeout=20', '--thread-count=0',
-                        '--enable-reuse', "--collection-cache-size=256", '--debug', '--on-error=continue',
+                                       '--no-log-timestamps', '--disable-validate', '--disable-color',
+                                       '--eval-timeout=20', '--thread-count=0',
+                                       '--enable-reuse', "--collection-cache-size=256",
+                                       '--output-name=Output from workflow submit_wf.cwl (%s)' % stubs.git_props["arv:gitDescribe"],
+                                       '--debug', '--on-error=continue',
                                         '--disable-preemptible',
-                        '/var/lib/cwl/workflow.json#main', '/var/lib/cwl/cwl.input.json']
+                                       '/var/lib/cwl/workflow.json#main', '/var/lib/cwl/cwl.input.json']
+
+        stubs.api.container_requests().create.assert_called_with(
+            body=JsonDiffMatcher(expect_container))
+        self.assertEqual(stubs.capture_stdout.getvalue(),
+                         stubs.expect_container_request_uuid + '\n')
+        self.assertEqual(exited, 0)
+
+    @stubs()
+    def test_submit_container_prefer_cached_downloads(self, stubs):
+        exited = arvados_cwl.main(
+            ["--submit", "--no-wait", "--api=containers", "--debug", "--prefer-cached-downloads",
+                "tests/wf/submit_wf.cwl", "tests/submit_test_job.json"],
+            stubs.capture_stdout, sys.stderr, api_client=stubs.api, keep_client=stubs.keep_client)
+
+        expect_container = copy.deepcopy(stubs.expect_container_spec)
+        expect_container["command"] = ['arvados-cwl-runner', '--local', '--api=containers',
+                                       '--no-log-timestamps', '--disable-validate', '--disable-color',
+                                       '--eval-timeout=20', '--thread-count=0',
+                                       '--enable-reuse', "--collection-cache-size=256",
+                                       '--output-name=Output from workflow submit_wf.cwl (%s)' % stubs.git_props["arv:gitDescribe"],
+                                       '--debug', "--on-error=continue", '--prefer-cached-downloads',
+                                       '/var/lib/cwl/workflow.json#main', '/var/lib/cwl/cwl.input.json']
+
+        stubs.api.container_requests().create.assert_called_with(
+            body=JsonDiffMatcher(expect_container))
+        self.assertEqual(stubs.capture_stdout.getvalue(),
+                         stubs.expect_container_request_uuid + '\n')
+        self.assertEqual(exited, 0)
+
+    @stubs()
+    def test_submit_container_varying_url_params(self, stubs):
+        exited = arvados_cwl.main(
+            ["--submit", "--no-wait", "--api=containers", "--debug", "--varying-url-params", "KeyId,Signature",
+                "tests/wf/submit_wf.cwl", "tests/submit_test_job.json"],
+            stubs.capture_stdout, sys.stderr, api_client=stubs.api, keep_client=stubs.keep_client)
+
+        expect_container = copy.deepcopy(stubs.expect_container_spec)
+        expect_container["command"] = ['arvados-cwl-runner', '--local', '--api=containers',
+                                       '--no-log-timestamps', '--disable-validate', '--disable-color',
+                                       '--eval-timeout=20', '--thread-count=0',
+                                       '--enable-reuse', "--collection-cache-size=256",
+                                       '--output-name=Output from workflow submit_wf.cwl (%s)' % stubs.git_props["arv:gitDescribe"],
+                                       '--debug', "--on-error=continue", "--varying-url-params=KeyId,Signature",
+                                       '/var/lib/cwl/workflow.json#main', '/var/lib/cwl/cwl.input.json']
  
          stubs.api.container_requests().create.assert_called_with(
              body=JsonDiffMatcher(expect_container))
@@ -1574,7 +1635,9 @@ class TestSubmit(unittest.TestCase):
  class TestCreateWorkflow(unittest.TestCase):
      existing_workflow_uuid = "zzzzz-7fd4e-validworkfloyml"
      expect_workflow = StripYAMLComments(
-        open("tests/wf/expect_upload_packed.cwl").read().rstrip())
+        open("tests/wf/expect_upload_wrapper.cwl").read().rstrip())
+    expect_workflow_altname = StripYAMLComments(
+        open("tests/wf/expect_upload_wrapper_altname.cwl").read().rstrip())
  
      def setUp(self):
          cwltool.process._names = set()
@@ -1587,7 +1650,7 @@ class TestCreateWorkflow(unittest.TestCase):
          handlers = [h for h in root_logger.handlers if not isinstance(h, arvados_cwl.executor.RuntimeStatusLoggingHandler)]
          root_logger.handlers = handlers
  
-    @stubs
+    @stubs()
      def test_create(self, stubs):
          project_uuid = 'zzzzz-j7d0g-zzzzzzzzzzzzzzz'
          stubs.api.groups().get().execute.return_value = {"group_class": "project"}
@@ -1596,6 +1659,7 @@ class TestCreateWorkflow(unittest.TestCase):
              ["--create-workflow", "--debug",
               "--api=containers",
               "--project-uuid", project_uuid,
+             "--disable-git",
               "tests/wf/submit_wf.cwl", "tests/submit_test_job.json"],
              stubs.capture_stdout, sys.stderr, api_client=stubs.api)
  
@@ -1617,7 +1681,7 @@ class TestCreateWorkflow(unittest.TestCase):
                           stubs.expect_workflow_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_create_name(self, stubs):
          project_uuid = 'zzzzz-j7d0g-zzzzzzzzzzzzzzz'
          stubs.api.groups().get().execute.return_value = {"group_class": "project"}
@@ -1627,6 +1691,7 @@ class TestCreateWorkflow(unittest.TestCase):
               "--api=containers",
               "--project-uuid", project_uuid,
               "--name", "testing 123",
+             "--disable-git",
               "tests/wf/submit_wf.cwl", "tests/submit_test_job.json"],
              stubs.capture_stdout, sys.stderr, api_client=stubs.api)
  
@@ -1638,7 +1703,7 @@ class TestCreateWorkflow(unittest.TestCase):
                  "owner_uuid": project_uuid,
                  "name": "testing 123",
                  "description": "",
-                "definition": self.expect_workflow,
+                "definition": self.expect_workflow_altname,
              }
          }
          stubs.api.workflows().create.assert_called_with(
@@ -1649,7 +1714,7 @@ class TestCreateWorkflow(unittest.TestCase):
          self.assertEqual(exited, 0)
  
  
-    @stubs
+    @stubs()
      def test_update(self, stubs):
          project_uuid = 'zzzzz-j7d0g-zzzzzzzzzzzzzzz'
          stubs.api.workflows().get().execute.return_value = {"owner_uuid": project_uuid}
@@ -1657,6 +1722,7 @@ class TestCreateWorkflow(unittest.TestCase):
          exited = arvados_cwl.main(
              ["--update-workflow", self.existing_workflow_uuid,
               "--debug",
+             "--disable-git",
               "tests/wf/submit_wf.cwl", "tests/submit_test_job.json"],
              stubs.capture_stdout, sys.stderr, api_client=stubs.api)
  
@@ -1676,7 +1742,7 @@ class TestCreateWorkflow(unittest.TestCase):
          self.assertEqual(exited, 0)
  
  
-    @stubs
+    @stubs()
      def test_update_name(self, stubs):
          project_uuid = 'zzzzz-j7d0g-zzzzzzzzzzzzzzz'
          stubs.api.workflows().get().execute.return_value = {"owner_uuid": project_uuid}
@@ -1684,6 +1750,7 @@ class TestCreateWorkflow(unittest.TestCase):
          exited = arvados_cwl.main(
              ["--update-workflow", self.existing_workflow_uuid,
               "--debug", "--name", "testing 123",
+             "--disable-git",
               "tests/wf/submit_wf.cwl", "tests/submit_test_job.json"],
              stubs.capture_stdout, sys.stderr, api_client=stubs.api)
  
@@ -1691,7 +1758,7 @@ class TestCreateWorkflow(unittest.TestCase):
              "workflow": {
                  "name": "testing 123",
                  "description": "",
-                "definition": self.expect_workflow,
+                "definition": self.expect_workflow_altname,
                  "owner_uuid": project_uuid
              }
          }
@@ -1702,7 +1769,7 @@ class TestCreateWorkflow(unittest.TestCase):
                           self.existing_workflow_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_create_collection_per_tool(self, stubs):
          project_uuid = 'zzzzz-j7d0g-zzzzzzzzzzzzzzz'
          stubs.api.groups().get().execute.return_value = {"group_class": "project"}
@@ -1711,10 +1778,11 @@ class TestCreateWorkflow(unittest.TestCase):
              ["--create-workflow", "--debug",
               "--api=containers",
               "--project-uuid", project_uuid,
+             "--disable-git",
               "tests/collection_per_tool/collection_per_tool.cwl"],
              stubs.capture_stdout, sys.stderr, api_client=stubs.api)
  
-        toolfile = "tests/collection_per_tool/collection_per_tool_packed.cwl"
+        toolfile = "tests/collection_per_tool/collection_per_tool_wrapper.cwl"
          expect_workflow = StripYAMLComments(open(toolfile).read().rstrip())
  
          body = {
@@ -1732,7 +1800,7 @@ class TestCreateWorkflow(unittest.TestCase):
                           stubs.expect_workflow_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_create_with_imports(self, stubs):
          project_uuid = 'zzzzz-j7d0g-zzzzzzzzzzzzzzz'
          stubs.api.groups().get().execute.return_value = {"group_class": "project"}
@@ -1751,7 +1819,7 @@ class TestCreateWorkflow(unittest.TestCase):
                           stubs.expect_workflow_uuid + '\n')
          self.assertEqual(exited, 0)
  
-    @stubs
+    @stubs()
      def test_create_with_no_input(self, stubs):
          project_uuid = 'zzzzz-j7d0g-zzzzzzzzzzzzzzz'
          stubs.api.groups().get().execute.return_value = {"group_class": "project"}
diff --git a/sdk/cwl/tests/wf/expect_upload_wrapper.cwl b/sdk/cwl/tests/wf/expect_upload_wrapper.cwl

new file mode 100644 (file)

index 0000000..3821527
--- /dev/null
+++ b/sdk/cwl/tests/wf/expect_upload_wrapper.cwl
@@ -0,0 +1,89 @@
+# Copyright (C) The Arvados Authors. All rights reserved.
+#
+# SPDX-License-Identifier: Apache-2.0
+
+{
+    "$graph": [
+        {
+            "class": "Workflow",
+            "hints": [
+                {
+                    "acrContainerImage": "999999999999999999999999999999d3+99",
+                    "class": "http://arvados.org/cwl#WorkflowRunnerResources"
+                }
+            ],
+            "id": "#main",
+            "inputs": [
+                {
+                    "default": {
+                        "basename": "blorp.txt",
+                        "class": "File",
+                        "location": "keep:169f39d466a5438ac4a90e779bf750c7+53/blorp.txt",
+                        "nameext": ".txt",
+                        "nameroot": "blorp",
+                        "size": 16
+                    },
+                    "id": "#main/x",
+                    "type": "File"
+                },
+                {
+                    "default": {
+                        "basename": "99999999999999999999999999999998+99",
+                        "class": "Directory",
+                        "location": "keep:99999999999999999999999999999998+99"
+                    },
+                    "id": "#main/y",
+                    "type": "Directory"
+                },
+                {
+                    "default": {
+                        "basename": "anonymous",
+                        "class": "Directory",
+                        "listing": [
+                            {
+                                "basename": "renamed.txt",
+                                "class": "File",
+                                "location": "keep:99999999999999999999999999999998+99/file1.txt",
+                                "nameext": ".txt",
+                                "nameroot": "renamed",
+                                "size": 0
+                            }
+                        ],
+                        "location": "_:df80736f-f14d-4b10-b2e3-03aa27f034b2"
+                    },
+                    "id": "#main/z",
+                    "type": "Directory"
+                }
+            ],
+            "outputs": [],
+            "requirements": [
+                {
+                    "class": "SubworkflowFeatureRequirement"
+                }
+            ],
+            "steps": [
+                {
+                    "id": "#main/submit_wf.cwl",
+                    "in": [
+                        {
+                            "id": "#main/step/x",
+                            "source": "#main/x"
+                        },
+                        {
+                            "id": "#main/step/y",
+                            "source": "#main/y"
+                        },
+                        {
+                            "id": "#main/step/z",
+                            "source": "#main/z"
+                        }
+                    ],
+                    "label": "submit_wf.cwl",
+                    "out": [],
+                    "run": "keep:f1c2b0c514a5fb9b2a8b5b38a31bab66+61/workflow.json#main"
+                }
+            ]
+        }
+    ],
+    "cwlVersion": "v1.2"
+}
diff --git a/sdk/cwl/tests/wf/expect_upload_wrapper_altname.cwl b/sdk/cwl/tests/wf/expect_upload_wrapper_altname.cwl

new file mode 100644 (file)

index 0000000..d486e5a
--- /dev/null
+++ b/sdk/cwl/tests/wf/expect_upload_wrapper_altname.cwl
@@ -0,0 +1,89 @@
+# Copyright (C) The Arvados Authors. All rights reserved.
+#
+# SPDX-License-Identifier: Apache-2.0
+
+{
+    "$graph": [
+        {
+            "class": "Workflow",
+            "hints": [
+                {
+                    "acrContainerImage": "999999999999999999999999999999d3+99",
+                    "class": "http://arvados.org/cwl#WorkflowRunnerResources"
+                }
+            ],
+            "id": "#main",
+            "inputs": [
+                {
+                    "default": {
+                        "basename": "blorp.txt",
+                        "class": "File",
+                        "location": "keep:169f39d466a5438ac4a90e779bf750c7+53/blorp.txt",
+                        "nameext": ".txt",
+                        "nameroot": "blorp",
+                        "size": 16
+                    },
+                    "id": "#main/x",
+                    "type": "File"
+                },
+                {
+                    "default": {
+                        "basename": "99999999999999999999999999999998+99",
+                        "class": "Directory",
+                        "location": "keep:99999999999999999999999999999998+99"
+                    },
+                    "id": "#main/y",
+                    "type": "Directory"
+                },
+                {
+                    "default": {
+                        "basename": "anonymous",
+                        "class": "Directory",
+                        "listing": [
+                            {
+                                "basename": "renamed.txt",
+                                "class": "File",
+                                "location": "keep:99999999999999999999999999999998+99/file1.txt",
+                                "nameext": ".txt",
+                                "nameroot": "renamed",
+                                "size": 0
+                            }
+                        ],
+                        "location": "_:df80736f-f14d-4b10-b2e3-03aa27f034b2"
+                    },
+                    "id": "#main/z",
+                    "type": "Directory"
+                }
+            ],
+            "outputs": [],
+            "requirements": [
+                {
+                    "class": "SubworkflowFeatureRequirement"
+                }
+            ],
+            "steps": [
+                {
+                    "id": "#main/submit_wf.cwl",
+                    "in": [
+                        {
+                            "id": "#main/step/x",
+                            "source": "#main/x"
+                        },
+                        {
+                            "id": "#main/step/y",
+                            "source": "#main/y"
+                        },
+                        {
+                            "id": "#main/step/z",
+                            "source": "#main/z"
+                        }
+                    ],
+                    "label": "testing 123",
+                    "out": [],
+                    "run": "keep:f1c2b0c514a5fb9b2a8b5b38a31bab66+61/workflow.json#main"
+                }
+            ]
+        }
+    ],
+    "cwlVersion": "v1.2"
+}
diff --git a/sdk/dev-jobs.dockerfile b/sdk/dev-jobs.dockerfile

index b55b056b2d38339fe4bb42ddd15ba267099975ea..60db4a889815c1f66e9c1070b35b1077fc5b1d8b 100644 (file)
--- a/sdk/dev-jobs.dockerfile
+++ b/sdk/dev-jobs.dockerfile
@@ -35,11 +35,17 @@ ADD cwl/salad_dist/$salad /tmp/
  ADD cwl/cwltool_dist/$cwltool /tmp/
  ADD cwl/dist/$runner /tmp/
  
+RUN $pipcmd install wheel
  RUN cd /tmp/arvados-python-client-* && $pipcmd install .
  RUN if test -d /tmp/schema-salad-* ; then cd /tmp/schema-salad-* && $pipcmd install . ; fi
  RUN if test -d /tmp/cwltool-* ; then cd /tmp/cwltool-* && $pipcmd install . ; fi
  RUN cd /tmp/arvados-cwl-runner-* && $pipcmd install .
  
+# Sometimes Python dependencies install successfully but don't
+# actually work.  So run arvados-cwl-runner here to catch fun
+# dependency errors like pkg_resources.DistributionNotFound.
+RUN arvados-cwl-runner --version
+
  # Install dependencies and set up system.
  RUN /usr/sbin/adduser --disabled-password \
        --gecos 'Crunch execution user' crunch && \
diff --git a/sdk/go/arvados/api.go b/sdk/go/arvados/api.go

index 3797a17f50d504ae2894ac4c6a68f598b4e37564..bec387e85737f9d745c81bc6f1fbc5dae54f27cf 100644 (file)
--- a/sdk/go/arvados/api.go
+++ b/sdk/go/arvados/api.go
@@ -70,6 +70,11 @@ var (
         EndpointLinkGet                       = APIEndpoint{"GET", "arvados/v1/links/{uuid}", ""}
         EndpointLinkList                      = APIEndpoint{"GET", "arvados/v1/links", ""}
         EndpointLinkDelete                    = APIEndpoint{"DELETE", "arvados/v1/links/{uuid}", ""}
+       EndpointLogCreate                     = APIEndpoint{"POST", "arvados/v1/logs", "log"}
+       EndpointLogUpdate                     = APIEndpoint{"PATCH", "arvados/v1/logs/{uuid}", "log"}
+       EndpointLogGet                        = APIEndpoint{"GET", "arvados/v1/logs/{uuid}", ""}
+       EndpointLogList                       = APIEndpoint{"GET", "arvados/v1/logs", ""}
+       EndpointLogDelete                     = APIEndpoint{"DELETE", "arvados/v1/logs/{uuid}", ""}
         EndpointSysTrashSweep                 = APIEndpoint{"POST", "sys/trash_sweep", ""}
         EndpointUserActivate                  = APIEndpoint{"POST", "arvados/v1/users/{uuid}/activate", ""}
         EndpointUserCreate                    = APIEndpoint{"POST", "arvados/v1/users", "user"}
@@ -284,6 +289,11 @@ type API interface {
         LinkGet(ctx context.Context, options GetOptions) (Link, error)
         LinkList(ctx context.Context, options ListOptions) (LinkList, error)
         LinkDelete(ctx context.Context, options DeleteOptions) (Link, error)
+       LogCreate(ctx context.Context, options CreateOptions) (Log, error)
+       LogUpdate(ctx context.Context, options UpdateOptions) (Log, error)
+       LogGet(ctx context.Context, options GetOptions) (Log, error)
+       LogList(ctx context.Context, options ListOptions) (LogList, error)
+       LogDelete(ctx context.Context, options DeleteOptions) (Log, error)
         SpecimenCreate(ctx context.Context, options CreateOptions) (Specimen, error)
         SpecimenUpdate(ctx context.Context, options UpdateOptions) (Specimen, error)
         SpecimenGet(ctx context.Context, options GetOptions) (Specimen, error)
diff --git a/sdk/go/arvados/client.go b/sdk/go/arvados/client.go

index cdc07bb0afd2c80b09985ad28f18c6c0fa1abcde..4d140517e53687e7d62f9d211a1c566825a631f4 100644 (file)
--- a/sdk/go/arvados/client.go
+++ b/sdk/go/arvados/client.go
@@ -7,6 +7,7 @@ package arvados
  import (
         "bytes"
         "context"
+       "crypto/rand"
         "crypto/tls"
         "encoding/json"
         "errors"
@@ -15,6 +16,7 @@ import (
         "io/fs"
         "io/ioutil"
         "log"
+       "math/big"
         "net"
         "net/http"
         "net/url"
@@ -151,10 +153,10 @@ func NewClientFromConfig(cluster *Cluster) (*Client, error) {
  // Space characters are trimmed when reading the settings file, so
  // these are equivalent:
  //
-//   ARVADOS_API_HOST=localhost\n
-//   ARVADOS_API_HOST=localhost\r\n
-//   ARVADOS_API_HOST = localhost \n
-//   \tARVADOS_API_HOST = localhost\n
+//     ARVADOS_API_HOST=localhost\n
+//     ARVADOS_API_HOST=localhost\r\n
+//     ARVADOS_API_HOST = localhost \n
+//     \tARVADOS_API_HOST = localhost\n
  func NewClientFromEnv() *Client {
         vars := map[string]string{}
         home := os.Getenv("HOME")
@@ -328,11 +330,11 @@ func (c *Client) DoAndDecode(dst interface{}, req *http.Request) error {
  
  // Convert an arbitrary struct to url.Values. For example,
  //
-//     Foo{Bar: []int{1,2,3}, Baz: "waz"}
+//     Foo{Bar: []int{1,2,3}, Baz: "waz"}
  //
  // becomes
  //
-//     url.Values{`bar`:`{"a":[1,2,3]}`,`Baz`:`waz`}
+//     url.Values{`bar`:`{"a":[1,2,3]}`,`Baz`:`waz`}
  //
  // params itself is returned if it is already an url.Values.
  func anythingToValues(params interface{}) (url.Values, error) {
@@ -599,3 +601,25 @@ func (c *Client) PathForUUID(method, uuid string) (string, error) {
         }
         return path, nil
  }
+
+// maxUUIDInt is 36^15: the exclusive upper bound of a random integer
+// that fits in the 15 base-36 digits of a UUID's final part.
+var maxUUIDInt = (&big.Int{}).Exp(big.NewInt(36), big.NewInt(15), nil)
+
+// RandomUUID returns clusterID + "-" + infix + "-" + a random
+// 15-digit base-36 string drawn from crypto/rand.
+//
+// It panics if the system random source returns an error.
+func RandomUUID(clusterID, infix string) string {
+       n, err := rand.Int(rand.Reader, maxUUIDInt)
+       if err != nil {
+               panic(err)
+       }
+       // n.Text(36) omits leading zeros, so left-pad to keep the
+       // last part exactly 15 characters long.
+       suffix := n.Text(36)
+       for len(suffix) < 15 {
+               suffix = "0" + suffix
+       }
+       return clusterID + "-" + infix + "-" + suffix
+}
diff --git a/sdk/go/arvados/config.go b/sdk/go/arvados/config.go

index eb564cb6102f2f16249bd37e8ac0ecbfe5bf579c..bc6aab298fdcab19991528c1949b9d7bbac5efaf 100644 (file)
--- a/sdk/go/arvados/config.go
+++ b/sdk/go/arvados/config.go
@@ -200,11 +200,12 @@ type Cluster struct {
                         Enable bool
                         Users  map[string]TestUser
                 }
-               LoginCluster       string
-               RemoteTokenRefresh Duration
-               TokenLifetime      Duration
-               TrustedClients     map[string]struct{}
-               IssueTrustedTokens bool
+               LoginCluster         string
+               RemoteTokenRefresh   Duration
+               TokenLifetime        Duration
+               TrustedClients       map[URL]struct{}
+               TrustPrivateNetworks bool
+               IssueTrustedTokens   bool
         }
         Mail struct {
                 MailchimpAPIKey                string
@@ -248,6 +249,7 @@ type Cluster struct {
                 PreferDomainForUsername               string
                 UserSetupMailText                     string
                 RoleGroupsVisibleToAll                bool
+               ActivityLoggingPeriod                 Duration
         }
         StorageClasses map[string]StorageClassConfig
         Volumes        map[string]Volume
@@ -290,6 +292,7 @@ type Cluster struct {
                 SSHHelpPageHTML        string
                 SSHHelpHostSuffix      string
                 IdleTimeout            Duration
+               BannerURL              string
         }
  }
  
@@ -393,7 +396,7 @@ func (su *URL) UnmarshalText(text []byte) error {
  }
  
  func (su URL) MarshalText() ([]byte, error) {
-       return []byte(fmt.Sprintf("%s", (*url.URL)(&su).String())), nil
+       return []byte(su.String()), nil
  }
  
  func (su URL) String() string {
@@ -444,6 +447,7 @@ type ContainersConfig struct {
         CrunchRunCommand              string
         CrunchRunArgumentsList        []string
         DefaultKeepCacheRAM           ByteSize
+       DefaultKeepCacheDisk          ByteSize
         DispatchPrivateKey            string
         LogReuseDecisions             bool
         MaxComputeVMs                 int
@@ -465,6 +469,7 @@ type ContainersConfig struct {
         }
         Logging struct {
                 MaxAge                       Duration
+               SweepInterval                Duration
                 LogBytesPerEvent             int
                 LogSecondsBetweenEvents      Duration
                 LogThrottlePeriod            Duration
@@ -532,9 +537,11 @@ type InstanceTypeMap map[string]InstanceType
  var errDuplicateInstanceTypeName = errors.New("duplicate instance type name")
  
  // UnmarshalJSON does special handling of InstanceTypes:
-// * populate computed fields (Name and Scratch)
-// * error out if InstancesTypes are populated as an array, which was
-//   deprecated in Arvados 1.2.0
+//
+// - populate computed fields (Name and Scratch)
+//
+// - error out if InstanceTypes are populated as an array, which was
+// deprecated in Arvados 1.2.0
  func (it *InstanceTypeMap) UnmarshalJSON(data []byte) error {
         fixup := func(t InstanceType) (InstanceType, error) {
                 if t.ProviderType == "" {
diff --git a/sdk/go/arvados/container.go b/sdk/go/arvados/container.go

index 45f92017c4d02be4a6d4063439ea8cd515dbd268..165c8112e8f1ed39cde40e2b6a913072ced0fe32 100644 (file)
--- a/sdk/go/arvados/container.go
+++ b/sdk/go/arvados/container.go
@@ -107,11 +107,12 @@ type CUDARuntimeConstraints struct {
  // RuntimeConstraints specify a container's compute resources (RAM,
  // CPU) and network connectivity.
  type RuntimeConstraints struct {
-       API          bool                   `json:"API"`
-       RAM          int64                  `json:"ram"`
-       VCPUs        int                    `json:"vcpus"`
-       KeepCacheRAM int64                  `json:"keep_cache_ram"`
-       CUDA         CUDARuntimeConstraints `json:"cuda"`
+       API           bool                   `json:"API"`
+       RAM           int64                  `json:"ram"`
+       VCPUs         int                    `json:"vcpus"`
+       KeepCacheRAM  int64                  `json:"keep_cache_ram"`
+       KeepCacheDisk int64                  `json:"keep_cache_disk"`
+       CUDA          CUDARuntimeConstraints `json:"cuda"`
  }
  
  // SchedulingParameters specify a container's scheduling parameters
diff --git a/sdk/go/arvados/duration.go b/sdk/go/arvados/duration.go

index c922f0a30dd49abd0f11b29f94d2ced6a8ea09cb..9df210ccb016ef85327b9eaf09ca3aacec0ae9f2 100644 (file)
--- a/sdk/go/arvados/duration.go
+++ b/sdk/go/arvados/duration.go
@@ -5,6 +5,7 @@
  package arvados
  
  import (
+       "bytes"
         "encoding/json"
         "fmt"
         "strings"
@@ -17,6 +18,13 @@ type Duration time.Duration
  
  // UnmarshalJSON implements json.Unmarshaler.
  func (d *Duration) UnmarshalJSON(data []byte) error {
+       if bytes.Equal(data, []byte(`"0"`)) || bytes.Equal(data, []byte(`0`)) {
+               // Unitless 0 is not accepted by ParseDuration, but we
+               // accept it as a reasonable spelling of 0
+               // nanoseconds.
+               *d = 0
+               return nil
+       }
         if data[0] == '"' {
                 return d.Set(string(data[1 : len(data)-1]))
         }
diff --git a/sdk/go/arvados/duration_test.go b/sdk/go/arvados/duration_test.go

index 6a198e69400201f803566b4e19022158956c50be..40344d061b0682327ded9ab016a8865410a923d5 100644 (file)
--- a/sdk/go/arvados/duration_test.go
+++ b/sdk/go/arvados/duration_test.go
@@ -60,4 +60,14 @@ func (s *DurationSuite) TestUnmarshalJSON(c *check.C) {
         err = json.Unmarshal([]byte(`{"D":"60s"}`), &d)
         c.Check(err, check.IsNil)
         c.Check(d.D.Duration(), check.Equals, time.Minute)
+
+       d.D = Duration(time.Second)
+       err = json.Unmarshal([]byte(`{"D":"0"}`), &d)
+       c.Check(err, check.IsNil)
+       c.Check(d.D.Duration(), check.Equals, time.Duration(0))
+
+       d.D = Duration(time.Second)
+       err = json.Unmarshal([]byte(`{"D":0}`), &d)
+       c.Check(err, check.IsNil)
+       c.Check(d.D.Duration(), check.Equals, time.Duration(0))
  }
diff --git a/sdk/go/arvados/fs_collection.go b/sdk/go/arvados/fs_collection.go

index a26c876b932304ab6fdfefbafe36145665cbac90..354658a257dba00d54f9d98f9f7c1328e84b7ae2 100644 (file)
--- a/sdk/go/arvados/fs_collection.go
+++ b/sdk/go/arvados/fs_collection.go
@@ -513,9 +513,9 @@ type filenodePtr struct {
  //
  // After seeking:
  //
-//     ptr.segmentIdx == len(filenode.segments) // i.e., at EOF
-//     ||
-//     filenode.segments[ptr.segmentIdx].Len() > ptr.segmentOff
+//     ptr.segmentIdx == len(filenode.segments) // i.e., at EOF
+//     ||
+//     filenode.segments[ptr.segmentIdx].Len() > ptr.segmentOff
  func (fn *filenode) seek(startPtr filenodePtr) (ptr filenodePtr) {
         ptr = startPtr
         if ptr.off < 0 {
diff --git a/sdk/go/arvados/log.go b/sdk/go/arvados/log.go

index 6f72634e5457e7379ee6660297be9aced63b91a0..06d7987e321299af7577084c043c0e56b5c664da 100644 (file)
--- a/sdk/go/arvados/log.go
+++ b/sdk/go/arvados/log.go
@@ -12,12 +12,15 @@ import (
  type Log struct {
         ID              uint64                 `json:"id"`
         UUID            string                 `json:"uuid"`
+       OwnerUUID       string                 `json:"owner_uuid"`
         ObjectUUID      string                 `json:"object_uuid"`
         ObjectOwnerUUID string                 `json:"object_owner_uuid"`
         EventType       string                 `json:"event_type"`
-       EventAt         *time.Time             `json:"event"`
+       EventAt         time.Time              `json:"event"`
+       Summary         string                 `json:"summary"`
         Properties      map[string]interface{} `json:"properties"`
-       CreatedAt       *time.Time             `json:"created_at"`
+       CreatedAt       time.Time              `json:"created_at"`
+       ModifiedAt      time.Time              `json:"modified_at"`
  }
  
  // LogList is an arvados#logList resource.
diff --git a/sdk/go/arvados/vocabulary.go b/sdk/go/arvados/vocabulary.go

index bb1bec789f7f459a3cd49657c4df5337711cce19..bf60a770267e437f7551bfb59fc60e62920fea9c 100644 (file)
--- a/sdk/go/arvados/vocabulary.go
+++ b/sdk/go/arvados/vocabulary.go
@@ -37,6 +37,8 @@ func (v *Vocabulary) systemTagKeys() map[string]bool {
                 "docker-image-repo-tag": true,
                 "filters":               true,
                 "container_request":     true,
+               "cwl_input":             true,
+               "cwl_output":            true,
         }
  }
  
diff --git a/sdk/go/arvados/vocabulary_test.go b/sdk/go/arvados/vocabulary_test.go

index 84b9bf2295e62e6025e0c6f03847c4d3e666a9eb..f31a4f984b36f7c70aa9987017d9596900c91173 100644 (file)
--- a/sdk/go/arvados/vocabulary_test.go
+++ b/sdk/go/arvados/vocabulary_test.go
@@ -238,6 +238,8 @@ func (s *VocabularySuite) TestNewVocabulary(c *check.C) {
                                         "docker-image-repo-tag": true,
                                         "filters":               true,
                                         "container_request":     true,
+                                       "cwl_input":             true,
+                                       "cwl_output":            true,
                                 },
                                 StrictTags: false,
                                 Tags: map[string]VocabularyTag{
diff --git a/sdk/go/arvadostest/api.go b/sdk/go/arvadostest/api.go

index d6da579d6b9ce1323dfbeb9b50f993232822379a..83efd889286d63bc9efd8fd4368850a2870a9d15 100644 (file)
--- a/sdk/go/arvadostest/api.go
+++ b/sdk/go/arvadostest/api.go
@@ -193,6 +193,26 @@ func (as *APIStub) LinkDelete(ctx context.Context, options arvados.DeleteOptions
         as.appendCall(ctx, as.LinkDelete, options)
         return arvados.Link{}, as.Error
  }
+func (as *APIStub) LogCreate(ctx context.Context, options arvados.CreateOptions) (arvados.Log, error) {
+       as.appendCall(ctx, as.LogCreate, options)
+       return arvados.Log{}, as.Error
+}
+func (as *APIStub) LogUpdate(ctx context.Context, options arvados.UpdateOptions) (arvados.Log, error) {
+       as.appendCall(ctx, as.LogUpdate, options)
+       return arvados.Log{}, as.Error
+}
+func (as *APIStub) LogGet(ctx context.Context, options arvados.GetOptions) (arvados.Log, error) {
+       as.appendCall(ctx, as.LogGet, options)
+       return arvados.Log{}, as.Error
+}
+func (as *APIStub) LogList(ctx context.Context, options arvados.ListOptions) (arvados.LogList, error) {
+       as.appendCall(ctx, as.LogList, options)
+       return arvados.LogList{}, as.Error
+}
+func (as *APIStub) LogDelete(ctx context.Context, options arvados.DeleteOptions) (arvados.Log, error) {
+       as.appendCall(ctx, as.LogDelete, options)
+       return arvados.Log{}, as.Error
+}
  func (as *APIStub) SpecimenCreate(ctx context.Context, options arvados.CreateOptions) (arvados.Specimen, error) {
         as.appendCall(ctx, as.SpecimenCreate, options)
         return arvados.Specimen{}, as.Error
diff --git a/sdk/go/arvadostest/db.go b/sdk/go/arvadostest/db.go

index c20f61db26301be6be323d2097be5c55f3d17037..d39f3c6fcbfab8093649ab817612de6bee55b8f7 100644 (file)
--- a/sdk/go/arvadostest/db.go
+++ b/sdk/go/arvadostest/db.go
@@ -5,11 +5,9 @@
  package arvadostest
  
  import (
-       "context"
-
-       "git.arvados.org/arvados.git/lib/ctrlctx"
         "git.arvados.org/arvados.git/sdk/go/arvados"
         "github.com/jmoiron/sqlx"
+
         // sqlx needs lib/pq to talk to PostgreSQL
         _ "github.com/lib/pq"
         "gopkg.in/check.v1"
@@ -21,14 +19,3 @@ func DB(c *check.C, cluster *arvados.Cluster) *sqlx.DB {
         c.Assert(err, check.IsNil)
         return db
  }
-
-// TransactionContext returns a context suitable for running a test
-// case in a new transaction, and a rollback func which the caller
-// should call after the test.
-func TransactionContext(c *check.C, db *sqlx.DB) (ctx context.Context, rollback func()) {
-       tx, err := db.Beginx()
-       c.Assert(err, check.IsNil)
-       return ctrlctx.NewWithTransaction(context.Background(), tx), func() {
-               c.Check(tx.Rollback(), check.IsNil)
-       }
-}
diff --git a/sdk/go/health/aggregator.go b/sdk/go/health/aggregator.go

index b5301dffe006ec280f379d56ca9330818eb029b6..3bf37b12942bebc1b5e83265884f55f4ddd1bcc5 100644 (file)
--- a/sdk/go/health/aggregator.go
+++ b/sdk/go/health/aggregator.go
@@ -135,6 +135,7 @@ type CheckResult struct {
         Response       map[string]interface{} `json:",omitempty"`
         ResponseTime   json.Number
         ClockTime      time.Time
+       Server         string // "Server" header in http response
         Metrics
         respTime time.Duration
  }
@@ -223,7 +224,8 @@ func (agg *Aggregator) ClusterHealth() ClusterHealthResponse {
         for svcName, sh := range resp.Services {
                 switch svcName {
                 case arvados.ServiceNameDispatchCloud,
-                       arvados.ServiceNameDispatchLSF:
+                       arvados.ServiceNameDispatchLSF,
+                       arvados.ServiceNameDispatchSLURM:
                         // ok to not run any given dispatcher
                 case arvados.ServiceNameHealth,
                         arvados.ServiceNameWorkbench1,
@@ -359,6 +361,7 @@ func (agg *Aggregator) ping(target *url.URL) (result CheckResult) {
         }
         result.Health = "OK"
         result.ClockTime, _ = time.Parse(time.RFC1123, resp.Header.Get("Date"))
+       result.Server = resp.Header.Get("Server")
         return
  }
  
@@ -437,7 +440,7 @@ func (ccmd checkCommand) RunCommand(prog string, args []string, stdin io.Reader,
         err := ccmd.run(ctx, prog, args, stdin, stdout, stderr)
         if err != nil {
                 if err != errSilent {
-                       fmt.Fprintln(stdout, err.Error())
+                       fmt.Fprintln(stderr, err.Error())
                 }
                 return 1
         }
@@ -451,7 +454,8 @@ func (ccmd checkCommand) run(ctx context.Context, prog string, args []string, st
         loader.SetupFlags(flags)
         versionFlag := flags.Bool("version", false, "Write version information to stdout and exit 0")
         timeout := flags.Duration("timeout", defaultTimeout.Duration(), "Maximum time to wait for health responses")
-       outputYAML := flags.Bool("yaml", false, "Output full health report in YAML format (default mode shows errors as plain text, is silent on success)")
+       quiet := flags.Bool("quiet", false, "Silent on success (suppress 'health check OK' message on stderr)")
+       outputYAML := flags.Bool("yaml", false, "Output full health report in YAML format (default mode prints 'health check OK' or plain text errors)")
         if ok, _ := cmd.ParseFlags(flags, prog, args, "", stderr); !ok {
                 // cmd.ParseFlags already reported the error
                 return errSilent
@@ -486,11 +490,14 @@ func (ccmd checkCommand) run(ctx context.Context, prog string, args []string, st
         }
         if resp.Health != "OK" {
                 for _, msg := range resp.Errors {
-                       fmt.Fprintln(stdout, msg)
+                       fmt.Fprintln(stderr, msg)
                 }
                 fmt.Fprintln(stderr, "health check failed")
                 return errSilent
         }
+       if !*quiet {
+               fmt.Fprintln(stderr, "health check OK")
+       }
         return nil
  }
  
diff --git a/sdk/go/health/aggregator_test.go b/sdk/go/health/aggregator_test.go

index b1166c27d457317b8a4f6d5b5bcdea69cc6bf273..f76f7b8ea80a45ba9d908e485d2dcae8b9eca300 100644 (file)
--- a/sdk/go/health/aggregator_test.go
+++ b/sdk/go/health/aggregator_test.go
@@ -321,6 +321,13 @@ func (s *AggregatorSuite) TestCheckCommand(c *check.C) {
  
         exitcode := CheckCommand.RunCommand("check", []string{"-config=" + tmpdir + "/config.yml"}, &bytes.Buffer{}, &stdout, &stderr)
         c.Check(exitcode, check.Equals, 0)
+       c.Check(stderr.String(), check.Equals, "health check OK\n")
+       c.Check(stdout.String(), check.Equals, "")
+
+       stdout.Reset()
+       stderr.Reset()
+       exitcode = CheckCommand.RunCommand("check", []string{"-quiet", "-config=" + tmpdir + "/config.yml"}, &bytes.Buffer{}, &stdout, &stderr)
+       c.Check(exitcode, check.Equals, 0)
         c.Check(stderr.String(), check.Equals, "")
         c.Check(stdout.String(), check.Equals, "")
  
diff --git a/sdk/go/keepclient/block_cache.go b/sdk/go/keepclient/block_cache.go

index bac4a24fd5a037d9cdcafb663612677304184c97..89eecc6e276f843d2085b727193c0324ef8d4d03 100644 (file)
--- a/sdk/go/keepclient/block_cache.go
+++ b/sdk/go/keepclient/block_cache.go
@@ -5,6 +5,7 @@
  package keepclient
  
  import (
+       "fmt"
         "io"
         "sort"
         "strconv"
@@ -93,8 +94,11 @@ func (c *BlockCache) Get(kc *KeepClient, locator string) ([]byte, error) {
                                 data = make([]byte, size, bufsize)
                                 _, err = io.ReadFull(rdr, data)
                                 err2 := rdr.Close()
-                               if err == nil {
-                                       err = err2
+                               if err == nil && err2 != nil {
+                                       err = fmt.Errorf("close(): %w", err2)
+                               }
+                               if err != nil {
+                                       err = fmt.Errorf("Get %s: %w", locator, err)
                                 }
                         }
                         c.mtx.Lock()
diff --git a/sdk/perl/.gitignore b/sdk/perl/.gitignore

deleted file mode 100644 (file)

index 7c32f55..0000000
--- a/sdk/perl/.gitignore
+++ /dev/null
@@ -1 +0,0 @@
-install
diff --git a/sdk/perl/Makefile.PL b/sdk/perl/Makefile.PL

deleted file mode 100644 (file)

index ec903f3..0000000
--- a/sdk/perl/Makefile.PL
+++ /dev/null
@@ -1,18 +0,0 @@
-#! /usr/bin/perl
-# Copyright (C) The Arvados Authors. All rights reserved.
-#
-# SPDX-License-Identifier: Apache-2.0
-
-use strict;
-
-use ExtUtils::MakeMaker;
-
-WriteMakefile(
-    NAME            => 'Arvados',
-    VERSION_FROM    => 'lib/Arvados.pm',
-    PREREQ_PM       => {
-        'JSON'     => 0,
-        'LWP'      => 0,
-        'Net::SSL' => 0,
-    },
-);
diff --git a/sdk/perl/lib/Arvados.pm b/sdk/perl/lib/Arvados.pm

deleted file mode 100644 (file)

index 9eb04b4..0000000
--- a/sdk/perl/lib/Arvados.pm
+++ /dev/null
@@ -1,165 +0,0 @@
-# Copyright (C) The Arvados Authors. All rights reserved.
-#
-# SPDX-License-Identifier: Apache-2.0
-
-=head1 NAME
-
-Arvados -- client library for Arvados services
-
-=head1 SYNOPSIS
-
-  use Arvados;
-  $arv = Arvados->new(apiHost => 'arvados.local');
-
-  my $instances = $arv->{'pipeline_instances'}->{'list'}->execute();
-  print "UUID is ", $instances->{'items'}->[0]->{'uuid'}, "\n";
-
-  $uuid = 'eiv0u-arx5y-2c5ovx43zw90gvh';
-  $instance = $arv->{'pipeline_instances'}->{'get'}->execute('uuid' => $uuid);
-  print "ETag is ", $instance->{'etag'}, "\n";
-
-  $instance->{'active'} = 1;
-  $instance->{'name'} = '';
-  $instance->save();
-  print "ETag is ", $instance->{'etag'}, "\n";
-
-=head1 METHODS
-
-=head2 new()
-
- my $whc = Arvados->new( %OPTIONS );
-
-Set up a client and retrieve the schema from the server.
-
-=head3 Options
-
-=over
-
-=item apiHost
-
-Hostname of API discovery service. Default: C<ARVADOS_API_HOST>
-environment variable, or C<arvados>
-
-=item apiProtocolScheme
-
-Protocol scheme. Default: C<ARVADOS_API_PROTOCOL_SCHEME> environment
-variable, or C<https>
-
-=item authToken
-
-Authorization token. Default: C<ARVADOS_API_TOKEN> environment variable
-
-=item apiService
-
-Default C<arvados>
-
-=item apiVersion
-
-Default C<v1>
-
-=back
-
-=cut
-
-package Arvados;
-
-use Net::SSL (); # From Crypt-SSLeay
-BEGIN {
-  $Net::HTTPS::SSL_SOCKET_CLASS = "Net::SSL"; # Force use of Net::SSL
-}
-
-use JSON;
-use Carp;
-use Arvados::ResourceAccessor;
-use Arvados::ResourceMethod;
-use Arvados::ResourceProxy;
-use Arvados::ResourceProxyList;
-use Arvados::Request;
-use Data::Dumper;
-
-$Arvados::VERSION = 0.1;
-
-sub new
-{
-    my $class = shift;
-    my %self = @_;
-    my $self = \%self;
-    bless ($self, $class);
-    return $self->build(@_);
-}
-
-sub build
-{
-    my $self = shift;
-
-    $config = load_config_file("$ENV{HOME}/.config/arvados/settings.conf");
-
-    $self->{'authToken'} ||=
-       $ENV{ARVADOS_API_TOKEN} || $config->{ARVADOS_API_TOKEN};
-
-    $self->{'apiHost'} ||=
-       $ENV{ARVADOS_API_HOST} || $config->{ARVADOS_API_HOST};
-
-    $self->{'noVerifyHostname'} ||=
-       $ENV{ARVADOS_API_HOST_INSECURE};
-
-    $self->{'apiProtocolScheme'} ||=
-       $ENV{ARVADOS_API_PROTOCOL_SCHEME} ||
-       $config->{ARVADOS_API_PROTOCOL_SCHEME};
-
-    $self->{'ua'} = new Arvados::Request;
-
-    my $host = $self->{'apiHost'} || 'arvados';
-    my $service = $self->{'apiService'} || 'arvados';
-    my $version = $self->{'apiVersion'} || 'v1';
-    my $scheme = $self->{'apiProtocolScheme'} || 'https';
-    my $uri = "$scheme://$host/discovery/v1/apis/$service/$version/rest";
-    my $r = $self->new_request;
-    $r->set_uri($uri);
-    $r->set_method("GET");
-    $r->process_request();
-    my $data, $headers;
-    my ($status_number, $status_phrase) = $r->get_status();
-    $data = $r->get_body() if $status_number == 200;
-    $headers = $r->get_headers();
-    if ($data) {
-        my $doc = $self->{'discoveryDocument'} = JSON::decode_json($data);
-        print STDERR Dumper $doc if $ENV{'DEBUG_ARVADOS_API_DISCOVERY'};
-        my $k, $v;
-        while (($k, $v) = each %{$doc->{'resources'}}) {
-            $self->{$k} = Arvados::ResourceAccessor->new($self, $k);
-        }
-    } else {
-        croak "No discovery doc at $uri - $status_number $status_phrase";
-    }
-    $self;
-}
-
-sub new_request
-{
-    my $self = shift;
-    local $ENV{'PERL_LWP_SSL_VERIFY_HOSTNAME'};
-    if ($self->{'noVerifyHostname'} || ($host =~ /\.local$/)) {
-        $ENV{'PERL_LWP_SSL_VERIFY_HOSTNAME'} = 0;
-    }
-    Arvados::Request->new();
-}
-
-sub load_config_file ($)
-{
-    my $config_file = shift;
-    my %config;
-
-    if (open (CONF, $config_file)) {
-       while (<CONF>) {
-           next if /^\s*#/ || /^\s*$/;  # skip comments and blank lines
-           chomp;
-           my ($key, $val) = split /\s*=\s*/, $_, 2;
-           $config{$key} = $val;
-       }
-    }
-    close CONF;
-    return \%config;
-}
-
-1;
diff --git a/sdk/perl/lib/Arvados/Request.pm b/sdk/perl/lib/Arvados/Request.pm

deleted file mode 100644 (file)

index 4523f7d..0000000
--- a/sdk/perl/lib/Arvados/Request.pm
+++ /dev/null
@@ -1,104 +0,0 @@
-# Copyright (C) The Arvados Authors. All rights reserved.
-#
-# SPDX-License-Identifier: Apache-2.0
-
-package Arvados::Request;
-use Data::Dumper;
-use LWP::UserAgent;
-use URI::Escape;
-use Encode;
-use strict;
-@Arvados::HTTP::ISA = qw(LWP::UserAgent);
-
-sub new
-{
-    my $class = shift;
-    my $self = {};
-    bless ($self, $class);
-    return $self->_init(@_);
-}
-
-sub _init
-{
-    my $self = shift;
-    $self->{'ua'} = new LWP::UserAgent(@_);
-    $self->{'ua'}->agent ("libarvados-perl/".$Arvados::VERSION);
-    $self;
-}
-
-sub set_uri
-{
-    my $self = shift;
-    $self->{'uri'} = shift;
-}
-
-sub process_request
-{
-    my $self = shift;
-    my %req;
-    my %content;
-    my $method = $self->{'method'};
-    if ($method eq 'GET' || $method eq 'HEAD') {
-        $content{'_method'} = $method;
-        $method = 'POST';
-    }
-    $req{$method} = $self->{'uri'};
-    $self->{'req'} = new HTTP::Request (%req);
-    $self->{'req'}->header('Authorization' => ('OAuth2 ' . $self->{'authToken'})) if $self->{'authToken'};
-    $self->{'req'}->header('Accept' => 'application/json');
-
-    # allow_nonref lets us encode JSON::true and JSON::false, see #12078
-    my $json = JSON->new->allow_nonref;
-    my ($p, $v);
-    while (($p, $v) = each %{$self->{'queryParams'}}) {
-        $content{$p} = (ref($v) eq "") ? $v : $json->encode($v);
-    }
-    my $content;
-    while (($p, $v) = each %content) {
-        $content .= '&' unless $content eq '';
-        $content .= uri_escape($p);
-        $content .= '=';
-        $content .= uri_escape($v);
-    }
-    $self->{'req'}->content_type("application/x-www-form-urlencoded; charset='utf8'");
-    $self->{'req'}->content(Encode::encode('utf8', $content));
-    $self->{'res'} = $self->{'ua'}->request ($self->{'req'});
-}
-
-sub get_status
-{
-    my $self = shift;
-    return ($self->{'res'}->code(),
-           $self->{'res'}->message());
-}
-
-sub get_body
-{
-    my $self = shift;
-    return $self->{'res'}->content;
-}
-
-sub set_method
-{
-    my $self = shift;
-    $self->{'method'} = shift;
-}
-
-sub set_query_params
-{
-    my $self = shift;
-    $self->{'queryParams'} = shift;
-}
-
-sub set_auth_token
-{
-    my $self = shift;
-    $self->{'authToken'} = shift;
-}
-
-sub get_headers
-{
-    ""
-}
-
-1;
diff --git a/sdk/perl/lib/Arvados/ResourceAccessor.pm b/sdk/perl/lib/Arvados/ResourceAccessor.pm

deleted file mode 100644 (file)

index 8b235fc..0000000
--- a/sdk/perl/lib/Arvados/ResourceAccessor.pm
+++ /dev/null
@@ -1,25 +0,0 @@
-# Copyright (C) The Arvados Authors. All rights reserved.
-#
-# SPDX-License-Identifier: Apache-2.0
-
-package Arvados::ResourceAccessor;
-use Carp;
-use Data::Dumper;
-
-sub new
-{
-    my $class = shift;
-    my $self = {};
-    bless ($self, $class);
-
-    $self->{'api'} = shift;
-    $self->{'resourcesName'} = shift;
-    $self->{'methods'} = $self->{'api'}->{'discoveryDocument'}->{'resources'}->{$self->{'resourcesName'}}->{'methods'};
-    my $method_name, $method;
-    while (($method_name, $method) = each %{$self->{'methods'}}) {
-        $self->{$method_name} = Arvados::ResourceMethod->new($self, $method);
-    }
-    $self;
-}
-
-1;
diff --git a/sdk/perl/lib/Arvados/ResourceMethod.pm b/sdk/perl/lib/Arvados/ResourceMethod.pm

deleted file mode 100644 (file)

index d7e86ff..0000000
--- a/sdk/perl/lib/Arvados/ResourceMethod.pm
+++ /dev/null
@@ -1,124 +0,0 @@
-# Copyright (C) The Arvados Authors. All rights reserved.
-#
-# SPDX-License-Identifier: Apache-2.0
-
-package Arvados::ResourceMethod;
-use Carp;
-use Data::Dumper;
-
-sub new
-{
-    my $class = shift;
-    my $self = {};
-    bless ($self, $class);
-    return $self->_init(@_);
-}
-
-sub _init
-{
-    my $self = shift;
-    $self->{'resourceAccessor'} = shift;
-    $self->{'method'} = shift;
-    return $self;
-}
-
-sub execute
-{
-    my $self = shift;
-    my $method = $self->{'method'};
-
-    my $path = $method->{'path'};
-
-    my %body_params;
-    my %given_params = @_;
-    my %extra_params = %given_params;
-    my %method_params = %{$method->{'parameters'}};
-    if ($method->{'request'}->{'properties'}) {
-        while (my ($prop_name, $prop_value) =
-               each %{$method->{'request'}->{'properties'}}) {
-            if (ref($prop_value) eq 'HASH' && $prop_value->{'$ref'}) {
-                $method_params{$prop_name} = { 'type' => 'object' };
-            }
-        }
-    }
-    while (my ($param_name, $param) = each %method_params) {
-        delete $extra_params{$param_name};
-        if ($param->{'required'} && !exists $given_params{$param_name}) {
-            croak("Required parameter not supplied: $param_name");
-        }
-        elsif ($param->{'location'} eq 'path') {
-            $path =~ s/{\Q$param_name\E}/$given_params{$param_name}/eg;
-        }
-        elsif (!exists $given_params{$param_name}) {
-            ;
-        }
-        elsif ($param->{'type'} eq 'object') {
-            my %param_value;
-            my ($p, $v);
-            if (exists $param->{'properties'}) {
-                while (my ($property_name, $property) =
-                       each %{$param->{'properties'}}) {
-                    # if the discovery doc specifies object structure,
-                    # convert to true/false depending on supplied type
-                    if (!exists $given_params{$param_name}->{$property_name}) {
-                        ;
-                    }
-                    elsif (!defined $given_params{$param_name}->{$property_name}) {
-                        $param_value{$property_name} = JSON::null;
-                    }
-                    elsif ($property->{'type'} eq 'boolean') {
-                        $param_value{$property_name} = $given_params{$param_name}->{$property_name} ? JSON::true : JSON::false;
-                    }
-                    else {
-                        $param_value{$property_name} = $given_params{$param_name}->{$property_name};
-                    }
-                }
-            }
-            else {
-                while (my ($property_name, $property) =
-                       each %{$given_params{$param_name}}) {
-                    if (ref $property eq '' || $property eq undef) {
-                        $param_value{$property_name} = $property;
-                    }
-                    elsif (ref $property eq 'HASH') {
-                        $param_value{$property_name} = {};
-                        while (my ($k, $v) = each %$property) {
-                            $param_value{$property_name}->{$k} = $v;
-                        }
-                    }
-                }
-            }
-            $body_params{$param_name} = \%param_value;
-        } elsif ($param->{'type'} eq 'boolean') {
-            $body_params{$param_name} = $given_params{$param_name} ? JSON::true : JSON::false;
-        } else {
-            $body_params{$param_name} = $given_params{$param_name};
-        }
-    }
-    if (%extra_params) {
-        croak("Unsupported parameter(s) passed to API call /$path: \"" . join('", "', keys %extra_params) . '"');
-    }
-    my $r = $self->{'resourceAccessor'}->{'api'}->new_request;
-    my $base_uri = $self->{'resourceAccessor'}->{'api'}->{'discoveryDocument'}->{'baseUrl'};
-    $base_uri =~ s:/$::;
-    $r->set_uri($base_uri . "/" . $path);
-    $r->set_method($method->{'httpMethod'});
-    $r->set_auth_token($self->{'resourceAccessor'}->{'api'}->{'authToken'});
-    $r->set_query_params(\%body_params) if %body_params;
-    $r->process_request();
-    my $data, $headers;
-    my ($status_number, $status_phrase) = $r->get_status();
-    if ($status_number != 200) {
-        croak("API call /$path failed: $status_number $status_phrase\n". $r->get_body());
-    }
-    $data = $r->get_body();
-    $headers = $r->get_headers();
-    my $result = JSON::decode_json($data);
-    if ($method->{'response'}->{'$ref'} =~ /List$/) {
-        Arvados::ResourceProxyList->new($result, $self->{'resourceAccessor'});
-    } else {
-        Arvados::ResourceProxy->new($result, $self->{'resourceAccessor'});
-    }
-}
-
-1;
diff --git a/sdk/perl/lib/Arvados/ResourceProxy.pm b/sdk/perl/lib/Arvados/ResourceProxy.pm

deleted file mode 100644 (file)

index d3be468..0000000
--- a/sdk/perl/lib/Arvados/ResourceProxy.pm
+++ /dev/null
@@ -1,61 +0,0 @@
-# Copyright (C) The Arvados Authors. All rights reserved.
-#
-# SPDX-License-Identifier: Apache-2.0
-
-package Arvados::ResourceProxy;
-
-sub new
-{
-    my $class = shift;
-    my $self = shift;
-    $self->{'resourceAccessor'} = shift;
-    bless ($self, $class);
-    $self;
-}
-
-sub save
-{
-    my $self = shift;
-    $response = $self->{'resourceAccessor'}->{'update'}->execute('uuid' => $self->{'uuid'}, $self->resource_parameter_name() => $self);
-    foreach my $param (keys %$self) {
-        if (exists $response->{$param}) {
-            $self->{$param} = $response->{$param};
-        }
-    }
-    $self;
-}
-
-sub update_attributes
-{
-    my $self = shift;
-    my %updates = @_;
-    $response = $self->{'resourceAccessor'}->{'update'}->execute('uuid' => $self->{'uuid'}, $self->resource_parameter_name() => \%updates);
-    foreach my $param (keys %updates) {
-        if (exists $response->{$param}) {
-            $self->{$param} = $response->{$param};
-        }
-    }
-    $self;
-}
-
-sub reload
-{
-    my $self = shift;
-    $response = $self->{'resourceAccessor'}->{'get'}->execute('uuid' => $self->{'uuid'});
-    foreach my $param (keys %$self) {
-        if (exists $response->{$param}) {
-            $self->{$param} = $response->{$param};
-        }
-    }
-    $self;
-}
-
-sub resource_parameter_name
-{
-    my $self = shift;
-    my $pname = $self->{'resourceAccessor'}->{'resourcesName'};
-    $pname =~ s/s$//;           # XXX not a very good singularize()
-    $pname;
-}
-
-1;
diff --git a/sdk/perl/lib/Arvados/ResourceProxyList.pm b/sdk/perl/lib/Arvados/ResourceProxyList.pm

deleted file mode 100644 (file)

index 7d8e187..0000000
--- a/sdk/perl/lib/Arvados/ResourceProxyList.pm
+++ /dev/null
@@ -1,24 +0,0 @@
-# Copyright (C) The Arvados Authors. All rights reserved.
-#
-# SPDX-License-Identifier: Apache-2.0
-
-package Arvados::ResourceProxyList;
-
-sub new
-{
-    my $class = shift;
-    my $self = {};
-    bless ($self, $class);
-    $self->_init(@_);
-}
-
-sub _init
-{
-    my $self = shift;
-    $self->{'serverResponse'} = shift;
-    $self->{'resourceAccessor'} = shift;
-    $self->{'items'} = [ map { Arvados::ResourceProxy->new($_, $self->{'resourceAccessor'}) } @{$self->{'serverResponse'}->{'items'}} ];
-    $self;
-}
-
-1;
diff --git a/sdk/python/README.rst b/sdk/python/README.rst

index 570e398a2895ffb61ff021e0f7a618e3c21051d6..5e9bf64c4f724a7cd90f4e8f40ff75ea67efd177 100644 (file)
--- a/sdk/python/README.rst
+++ b/sdk/python/README.rst
@@ -63,5 +63,5 @@ Testing and Development
  This package is one part of the Arvados source package, and it has
  integration tests to check interoperability with other Arvados
  components.  Our `hacking guide
-<https://arvados.org/projects/arvados/wiki/Hacking_Python_SDK>`_
+<https://dev.arvados.org/projects/arvados/wiki/Hacking_Python_SDK>`_
  describes how to set up a development environment and run tests.
diff --git a/sdk/python/arvados/collection.py b/sdk/python/arvados/collection.py

index 998481ab661105b68b0247d1a82c09211fa0d66e..e1138910aebfc501bdfd875c03bd568ea76c3f3e 100644 (file)
--- a/sdk/python/arvados/collection.py
+++ b/sdk/python/arvados/collection.py
@@ -1308,6 +1308,11 @@ class Collection(RichCollectionBase):
          super(Collection, self).__init__(parent)
          self._api_client = api_client
          self._keep_client = keep_client
+
+        # Use the keep client from ThreadSafeApiCache
+        if self._keep_client is None and isinstance(self._api_client, ThreadSafeApiCache):
+            self._keep_client = self._api_client.keep
+
          self._block_manager = block_manager
          self.replication_desired = replication_desired
          self._storage_classes_desired = storage_classes_desired
diff --git a/sdk/python/arvados/diskcache.py b/sdk/python/arvados/diskcache.py

new file mode 100644 (file)

index 0000000..15afa23
--- /dev/null
+++ b/sdk/python/arvados/diskcache.py
@@ -0,0 +1,238 @@
+# Copyright (C) The Arvados Authors. All rights reserved.
+#
+# SPDX-License-Identifier: Apache-2.0
+
+import threading
+import mmap
+import os
+import traceback
+import stat
+import tempfile
+import fcntl
+import time
+import errno
+import logging
+
+_logger = logging.getLogger('arvados.keep')
+
+cacheblock_suffix = ".keepcacheblock"
+
+class DiskCacheSlot(object):
+    __slots__ = ("locator", "ready", "content", "cachedir", "filehandle")
+
+    def __init__(self, locator, cachedir):
+        self.locator = locator
+        self.ready = threading.Event()
+        self.content = None
+        self.cachedir = cachedir
+        self.filehandle = None
+
+    def get(self):
+        self.ready.wait()
+        return self.content
+
+    def set(self, value):
+        tmpfile = None
+        try:
+            if value is None:
+                self.content = None
+                self.ready.set()
+                return
+
+            if len(value) == 0:
+                # Can't mmap a 0 length file
+                self.content = b''
+                self.ready.set()
+                return
+
+            if self.content is not None:
+                # Has been set already
+                self.ready.set()
+                return
+
+            blockdir = os.path.join(self.cachedir, self.locator[0:3])
+            os.makedirs(blockdir, mode=0o700, exist_ok=True)
+
+            final = os.path.join(blockdir, self.locator) + cacheblock_suffix
+
+            self.filehandle = tempfile.NamedTemporaryFile(dir=blockdir, delete=False, prefix="tmp", suffix=cacheblock_suffix)
+            tmpfile = self.filehandle.name
+            os.chmod(tmpfile, stat.S_IRUSR | stat.S_IWUSR)
+
+            # acquire a shared lock, this tells other processes that
+            # we're using this block and to please not delete it.
+            fcntl.flock(self.filehandle, fcntl.LOCK_SH)
+
+            self.filehandle.write(value)
+            self.filehandle.flush()
+            os.rename(tmpfile, final)
+            tmpfile = None
+
+            self.content = mmap.mmap(self.filehandle.fileno(), 0, access=mmap.ACCESS_READ)
+            # only set the event when mmap is successful
+            self.ready.set()
+        finally:
+            if tmpfile is not None:
+                # If the tempfile hasn't been renamed on disk yet, try to delete it.
+                try:
+                    os.remove(tmpfile)
+                except:
+                    pass
+
+    def size(self):
+        if self.content is None:
+            return 0
+        else:
+            return len(self.content)
+
+    def evict(self):
+        if self.content is not None and len(self.content) > 0:
+            # The mmap region might be in use when we decided to evict
+            # it.  This can happen if the cache is too small.
+            #
+            # If we call close() now, it'll throw an error if
+            # something tries to access it.
+            #
+            # However, we don't need to explicitly call mmap.close()
+            #
+            # I confirmed in mmapmodule.c that both close
+            # and deallocate do the same thing:
+            #
+            # a) close the file descriptor
+            # b) unmap the memory range
+            #
+            # So we can forget it in the cache and delete the file on
+            # disk, and it will tear it down after any other
+            # lingering Python references to the mapped memory are
+            # gone.
+
+            blockdir = os.path.join(self.cachedir, self.locator[0:3])
+            final = os.path.join(blockdir, self.locator) + cacheblock_suffix
+            try:
+                fcntl.flock(self.filehandle, fcntl.LOCK_UN)
+
+                # try to get an exclusive lock, this ensures other
+                # processes are not using the block.  It is
+                # nonblocking and will throw an exception if we
+                # can't get it, which is fine because that means
+                # we just won't try to delete it.
+                #
+                # I should note here, the file locking is not
+                # strictly necessary, we could just remove it and
+                # the kernel would ensure that the underlying
+                # inode remains available as long as other
+                # processes still have the file open.  However, if
+                # you have multiple processes sharing the cache
+                # and deleting each other's files, you'll end up
+                # with a bunch of ghost files that don't show up
+                # in the file system but are still taking up
+                # space, which isn't particularly user friendly.
+                # The locking strategy ensures that cache blocks
+                # in use remain visible.
+                #
+                fcntl.flock(self.filehandle, fcntl.LOCK_EX | fcntl.LOCK_NB)
+
+                os.remove(final)
+                return True
+            except OSError:
+                pass
+            finally:
+                self.filehandle = None
+                self.content = None
+            return False
+
+    @staticmethod
+    def get_from_disk(locator, cachedir):
+        blockdir = os.path.join(cachedir, locator[0:3])
+        final = os.path.join(blockdir, locator) + cacheblock_suffix
+
+        try:
+            filehandle = open(final, "rb")
+
+            # acquire a shared lock, this tells other processes that
+            # we're using this block and to please not delete it.
+            fcntl.flock(filehandle, fcntl.LOCK_SH)
+
+            content = mmap.mmap(filehandle.fileno(), 0, access=mmap.ACCESS_READ)
+            dc = DiskCacheSlot(locator, cachedir)
+            dc.filehandle = filehandle
+            dc.content = content
+            dc.ready.set()
+            return dc
+        except FileNotFoundError:
+            pass
+        except Exception as e:
+            traceback.print_exc()
+
+        return None
+
+    @staticmethod
+    def cache_usage(cachedir):
+        usage = 0
+        for root, dirs, files in os.walk(cachedir):
+            for name in files:
+                if not name.endswith(cacheblock_suffix):
+                    continue
+
+                blockpath = os.path.join(root, name)
+                res = os.stat(blockpath)
+                usage += res.st_size
+        return usage
+
+
+    @staticmethod
+    def init_cache(cachedir, maxslots):
+        #
+        # First check the disk cache works at all by creating a 1 byte cache entry
+        #
+        checkexists = DiskCacheSlot.get_from_disk('0cc175b9c0f1b6a831c399e269772661', cachedir)
+        ds = DiskCacheSlot('0cc175b9c0f1b6a831c399e269772661', cachedir)
+        ds.set(b'a')
+        if checkexists is None:
+            # Don't keep the test entry around unless it existed beforehand.
+            ds.evict()
+
+        # map in all the files in the cache directory, up to max slots.
+        # after max slots, try to delete the excess blocks.
+        #
+        # this gives the calling process ownership of all the blocks
+
+        blocks = []
+        for root, dirs, files in os.walk(cachedir):
+            for name in files:
+                if not name.endswith(cacheblock_suffix):
+                    continue
+
+                blockpath = os.path.join(root, name)
+                res = os.stat(blockpath)
+
+                if len(name) == (32+len(cacheblock_suffix)) and not name.startswith("tmp"):
+                    blocks.append((name[0:32], res.st_atime))
+                elif name.startswith("tmp") and ((time.time() - res.st_mtime) > 60):
+                    # found a temporary file more than 1 minute old,
+                    # try to delete it.
+                    try:
+                        os.remove(blockpath)
+                    except:
+                        pass
+
+        # sort by access time (atime), going from most recently
+        # accessed (highest timestamp) to least recently accessed
+        # (lowest timestamp).
+        blocks.sort(key=lambda x: x[1], reverse=True)
+
+        # Map in all the files we found, up to maxslots, if we exceed
+        # maxslots, start throwing things out.
+        cachelist = []
+        for b in blocks:
+            got = DiskCacheSlot.get_from_disk(b[0], cachedir)
+            if got is None:
+                continue
+            if len(cachelist) < maxslots:
+                cachelist.append(got)
+            else:
+                # we found more blocks than maxslots, try to
+                # throw it out of the cache.
+                got.evict()
+
+        return cachelist
diff --git a/sdk/python/arvados/errors.py b/sdk/python/arvados/errors.py

index 4fe1f76543a356f1c36aafea23efbc5895088c87..15b1f6d4b9883b53c995fd2724a50131b7b28b44 100644 (file)
--- a/sdk/python/arvados/errors.py
+++ b/sdk/python/arvados/errors.py
@@ -82,6 +82,8 @@ class KeepReadError(KeepRequestError):
      pass
  class KeepWriteError(KeepRequestError):
      pass
+class KeepCacheError(KeepRequestError):
+    pass
  class NotFoundError(KeepReadError):
      pass
  class NotImplementedError(Exception):
diff --git a/sdk/python/arvados/keep.py b/sdk/python/arvados/keep.py

index 44e915776734fe87020ba46b5d95d9985f8e8dfe..b9e22748c180190251a266f1d058fad039abae24 100644 (file)
--- a/sdk/python/arvados/keep.py
+++ b/sdk/python/arvados/keep.py
@@ -15,6 +15,7 @@ from builtins import object
  import collections
  import datetime
  import hashlib
+import errno
  import io
  import logging
  import math
@@ -26,8 +27,10 @@ import socket
  import ssl
  import sys
  import threading
+import resource
  from . import timer
  import urllib.parse
+import traceback
  
  if sys.version_info >= (3, 0):
      from io import BytesIO
@@ -39,6 +42,7 @@ import arvados.config as config
  import arvados.errors
  import arvados.retry as retry
  import arvados.util
+import arvados.diskcache
  
  _logger = logging.getLogger('arvados.keep')
  global_client_object = None
@@ -174,11 +178,50 @@ class Keep(object):
          return Keep.global_client_object().put(data, **kwargs)
  
  class KeepBlockCache(object):
-    # Default RAM cache is 256MiB
-    def __init__(self, cache_max=(256 * 1024 * 1024)):
+    def __init__(self, cache_max=0, max_slots=0, disk_cache=False, disk_cache_dir=None):
          self.cache_max = cache_max
          self._cache = []
          self._cache_lock = threading.Lock()
+        self._max_slots = max_slots
+        self._disk_cache = disk_cache
+        self._disk_cache_dir = disk_cache_dir
+
+        if self._disk_cache and self._disk_cache_dir is None:
+            self._disk_cache_dir = os.path.join(os.path.expanduser("~"), ".cache", "arvados", "keep")
+            os.makedirs(self._disk_cache_dir, mode=0o700, exist_ok=True)
+
+        if self._max_slots == 0:
+            if self._disk_cache:
+                # default max slots to half of maximum file handles
+                # NOFILE typically defaults to 1024 on Linux so this
+                # will be 512 slots.
+                self._max_slots = resource.getrlimit(resource.RLIMIT_NOFILE)[0] / 2
+            else:
+                # RAM cache slots
+                self._max_slots = 512
+
+        if self.cache_max == 0:
+            if self._disk_cache:
+                fs = os.statvfs(self._disk_cache_dir)
+                # Calculation of available space incorporates existing cache usage
+                existing_usage = arvados.diskcache.DiskCacheSlot.cache_usage(self._disk_cache_dir)
+                avail = (fs.f_bavail * fs.f_bsize + existing_usage) / 4
+                maxdisk = int((fs.f_blocks * fs.f_bsize) * 0.10)
+                # pick smallest of:
+                # 10% of total disk size
+                # 25% of available space
+                # max_slots * 64 MiB
+                self.cache_max = min(min(maxdisk, avail), (self._max_slots * 64 * 1024 * 1024))
+            else:
+                # 256 MiB in RAM
+                self.cache_max = (256 * 1024 * 1024)
+
+        self.cache_max = max(self.cache_max, 64 * 1024 * 1024)
+
+        if self._disk_cache:
+            self._cache = arvados.diskcache.DiskCacheSlot.init_cache(self._disk_cache_dir, self._max_slots)
+            self.cap_cache()
+
  
      class CacheSlot(object):
          __slots__ = ("locator", "ready", "content")
@@ -202,6 +245,9 @@ class KeepBlockCache(object):
              else:
                  return len(self.content)
  
+        def evict(self):
+            return True
+
      def cap_cache(self):
          '''Cap the cache size to self.cache_max'''
          with self._cache_lock:
@@ -209,12 +255,27 @@ class KeepBlockCache(object):
              # None (that means there was an error reading the block).
              self._cache = [c for c in self._cache if not (c.ready.is_set() and c.content is None)]
              sm = sum([slot.size() for slot in self._cache])
-            while len(self._cache) > 0 and sm > self.cache_max:
+            while len(self._cache) > 0 and (sm > self.cache_max or len(self._cache) > self._max_slots):
                  for i in range(len(self._cache)-1, -1, -1):
+                    # start from the back, find a slot that is a candidate to evict
                      if self._cache[i].ready.is_set():
+                        sz = self._cache[i].size()
+
+                        # If evict returns false it means the
+                        # underlying disk cache couldn't lock the file
+                        # for deletion because another process was using
+                        # it. Don't count it as reducing the amount
+                        # of data in the cache, find something else to
+                        # throw out.
+                        if self._cache[i].evict():
+                            sm -= sz
+
+                        # either way we forget about it.  either the
+                        # other process will delete it, or if we need
+                        # it again and it is still there, we'll find
+                        # it on disk.
                          del self._cache[i]
                          break
-                sm = sum([slot.size() for slot in self._cache])
  
      def _get(self, locator):
          # Test if the locator is already in the cache
@@ -226,6 +287,12 @@ class KeepBlockCache(object):
                      del self._cache[i]
                      self._cache.insert(0, n)
                  return n
+        if self._disk_cache:
+            # see if it exists on disk
+            n = arvados.diskcache.DiskCacheSlot.get_from_disk(locator, self._disk_cache_dir)
+            if n is not None:
+                self._cache.insert(0, n)
+                return n
          return None
  
      def get(self, locator):
@@ -241,10 +308,51 @@ class KeepBlockCache(object):
                  return n, False
              else:
                  # Add a new cache slot for the locator
-                n = KeepBlockCache.CacheSlot(locator)
+                if self._disk_cache:
+                    n = arvados.diskcache.DiskCacheSlot(locator, self._disk_cache_dir)
+                else:
+                    n = KeepBlockCache.CacheSlot(locator)
                  self._cache.insert(0, n)
                  return n, True
  
+    def set(self, slot, blob):
+        try:
+            slot.set(blob)
+            return
+        except OSError as e:
+            if e.errno == errno.ENOMEM:
+                # Reduce max slots to current - 4, cap cache and retry
+                with self._cache_lock:
+                    self._max_slots = max(4, len(self._cache) - 4)
+            elif e.errno == errno.ENOSPC:
+                # Reduce disk max space to current - 256 MiB, cap cache and retry
+                with self._cache_lock:
+                    sm = sum([st.size() for st in self._cache])
+                    self.cache_max = max((256 * 1024 * 1024), sm - (256 * 1024 * 1024))
+            elif e.errno == errno.ENODEV:
+                _logger.error("Unable to use disk cache: The underlying filesystem does not support memory mapping.")
+        except Exception as e:
+            pass
+        finally:
+            # Check if we should evict things from the cache.  Either
+            # because we added a new thing or there was an error and
+            # we possibly adjusted the limits down, so we might need
+            # to push something out.
+            self.cap_cache()
+
+        try:
+            # Only gets here if there was an error the first time. The
+            # exception handler adjusts limits downward in some cases
+            # to free up resources, which would make the operation
+            # succeed.
+            slot.set(blob)
+        except Exception as e:
+            # It failed again.  Give up.
+            slot.set(None)
+            raise arvados.errors.KeepCacheError("Unable to save block %s to disk cache: %s" % (slot.locator, e))
+
+        self.cap_cache()
+
  class Counter(object):
      def __init__(self, v=0):
          self._lk = threading.Lock()
@@ -1170,8 +1278,7 @@ class KeepClient(object):
                  return blob
          finally:
              if slot is not None:
-                slot.set(blob)
-                self.block_cache.cap_cache()
+                self.block_cache.set(slot, blob)
  
          # Q: Including 403 is necessary for the Keep tests to continue
          # passing, but maybe they should expect KeepReadError instead?
diff --git a/sdk/python/arvados/retry.py b/sdk/python/arvados/retry.py

index ea4095930fc78f7cbbb26c49f45a8fa66fbb4081..e93624a5d110fa8f935dde6adc83dca477bd9341 100644 (file)
--- a/sdk/python/arvados/retry.py
+++ b/sdk/python/arvados/retry.py
@@ -1,3 +1,16 @@
+"""Utilities to retry operations.
+
+The core of this module is `RetryLoop`, a utility class to retry operations
+that might fail. It can distinguish between temporary and permanent failures;
+provide exponential backoff; and save a series of results.
+
+It also provides utility functions for common operations with `RetryLoop`:
+
+* `check_http_response_success` can be used as a `RetryLoop` `success_check`
+  for HTTP response codes from the Arvados API server.
+* `retry_method` can decorate methods to provide a default `num_retries`
+  keyword argument.
+"""
  # Copyright (C) The Arvados Authors. All rights reserved.
  #
  # SPDX-License-Identifier: Apache-2.0
@@ -19,7 +32,7 @@ _HTTP_CAN_RETRY = set([408, 409, 422, 423, 500, 502, 503, 504])
  class RetryLoop(object):
      """Coordinate limited retries of code.
  
-    RetryLoop coordinates a loop that runs until it records a
+    `RetryLoop` coordinates a loop that runs until it records a
      successful result or tries too many times, whichever comes first.
      Typical use looks like:
  
@@ -33,30 +46,41 @@ class RetryLoop(object):
                  loop.save_result(result)
          if loop.success():
              return loop.last_result()
+
+    Arguments:
+
+    num_retries: int
+    : The maximum number of times to retry the loop if it
+      doesn't succeed.  This means the loop body could run at most
+      `num_retries + 1` times.
+
+    success_check: Callable
+    : This is a function that will be called each
+      time the loop saves a result.  The function should return
+      `True` if the result indicates the code succeeded, `False` if it
+      represents a permanent failure, and `None` if it represents a
+      temporary failure.  If no function is provided, the loop will
+      end after any result is saved.
+
+    backoff_start: float
+    : The number of seconds that must pass before the loop's second
+      iteration.  Default 0, which disables all waiting.
+
+    backoff_growth: float
+    : The wait time multiplier after each iteration.
+      Default 2 (i.e., double the wait time each time).
+
+    save_results: int
+    : Specify a number to store that many saved results from the loop.
+      These are available through the `results` attribute, oldest first.
+      Default 1.
+
+    max_wait: float
+    : Maximum number of seconds to wait between retries. Default 60.
      """
      def __init__(self, num_retries, success_check=lambda r: True,
                   backoff_start=0, backoff_growth=2, save_results=1,
                   max_wait=60):
-        """Construct a new RetryLoop.
-
-        Arguments:
-        * num_retries: The maximum number of times to retry the loop if it
-          doesn't succeed.  This means the loop could run at most 1+N times.
-        * success_check: This is a function that will be called each
-          time the loop saves a result.  The function should return
-          True if the result indicates loop success, False if it
-          represents a permanent failure state, and None if the loop
-          should continue.  If no function is provided, the loop will
-          end as soon as it records any result.
-        * backoff_start: The number of seconds that must pass before the
-          loop's second iteration.  Default 0, which disables all waiting.
-        * backoff_growth: The wait time multiplier after each iteration.
-          Default 2 (i.e., double the wait time each time).
-        * save_results: Specify a number to save the last N results
-          that the loop recorded.  These records are available through
-          the results attribute, oldest first.  Default 1.
-        * max_wait: Maximum number of seconds to wait between retries.
-        """
          self.tries_left = num_retries + 1
          self.check_result = success_check
          self.backoff_wait = backoff_start
@@ -69,12 +93,24 @@ class RetryLoop(object):
          self._success = None
  
      def __iter__(self):
+        """Return an iterator of retries."""
          return self
  
      def running(self):
+        """Return whether this loop is running.
+
+        Returns `None` if the loop has never run, `True` if it is still running,
+        or `False` if it has stopped—whether that's because it has saved a
+        successful result, a permanent failure, or has run out of retries.
+        """
          return self._running and (self._success is None)
  
      def __next__(self):
+        """Record a loop attempt.
+
+        If the loop is still running, decrements the number of tries left and
+        returns it. Otherwise, raises `StopIteration`.
+        """
          if self._running is None:
              self._running = True
          if (self.tries_left < 1) or not self.running():
@@ -94,8 +130,16 @@ class RetryLoop(object):
          """Record a loop result.
  
          Save the given result, and end the loop if it indicates
-        success or permanent failure.  See __init__'s documentation
-        about success_check to learn how to make that indication.
+        success or permanent failure. See documentation for the `__init__`
+        `success_check` argument to learn how that's indicated.
+
+        Raises `arvados.errors.AssertionError` if called after the loop has
+        already ended.
+
+        Arguments:
+
+        result: Any
+        : The result from this loop attempt to check and save.
          """
          if not self.running():
              raise arvados.errors.AssertionError(
@@ -107,13 +151,17 @@ class RetryLoop(object):
      def success(self):
          """Return the loop's end state.
  
-        Returns True if the loop obtained a successful result, False if it
-        encountered permanent failure, or else None.
+        Returns `True` if the loop recorded a successful result, `False` if it
+        recorded permanent failure, or else `None`.
          """
          return self._success
  
      def last_result(self):
-        """Return the most recent result the loop recorded."""
+        """Return the most recent result the loop saved.
+
+        Raises `arvados.errors.AssertionError` if called before any result has
+        been saved.
+        """
          try:
              return self.results[-1]
          except IndexError:
@@ -121,13 +169,19 @@ class RetryLoop(object):
                  "queried loop results before any were recorded")
  
      def attempts(self):
-        """Return the number of attempts that have been made.
+        """Return the number of results that have been saved.
  
-        Includes successes and failures."""
+        This count includes all kinds of results: success, permanent failure,
+        and temporary failure.
+        """
          return self._attempts
  
      def attempts_str(self):
-        """Human-readable attempts(): 'N attempts' or '1 attempt'"""
+        """Return a human-friendly string counting saved results.
+
+        This method returns '1 attempt' or 'N attempts', where the number
+        in the string is the number of saved results.
+        """
          if self._attempts == 1:
              return '1 attempt'
          else:
@@ -135,23 +189,30 @@ class RetryLoop(object):
  
  
  def check_http_response_success(status_code):
-    """Convert an HTTP status code to a loop control flag.
+    """Convert a numeric HTTP status code to a loop control flag.
  
-    Pass this method a numeric HTTP status code.  It returns True if
-    the code indicates success, None if it indicates temporary
-    failure, and False otherwise.  You can use this as the
-    success_check for a RetryLoop.
+    This method takes a numeric HTTP status code and returns `True` if
+    the code indicates success, `None` if it indicates temporary
+    failure, and `False` otherwise.  You can use this as the
+    `success_check` for a `RetryLoop` that queries the Arvados API server.
+    Specifically:
  
-    Implementation details:
-    * Any 2xx result returns True.
-    * A select few status codes, or any malformed responses, return None.
+    * Any 2xx result returns `True`.
+
+    * A select few status codes, or any malformed responses, return `None`.
        422 Unprocessable Entity is in this category.  This may not meet the
        letter of the HTTP specification, but the Arvados API server will
        use it for various server-side problems like database connection
        errors.
-    * Everything else returns False.  Note that this includes 1xx and
+
+    * Everything else returns `False`.  Note that this includes 1xx and
        3xx status codes.  They don't indicate success, and you can't
        retry those requests verbatim.
+
+    Arguments:
+
+    status_code: int
+    : A numeric HTTP response code
      """
      if status_code in _HTTP_SUCCESSES:
          return True
@@ -166,9 +227,14 @@ def retry_method(orig_func):
      """Provide a default value for a method's num_retries argument.
  
      This is a decorator for instance and class methods that accept a
-    num_retries argument, with a None default.  When the method is called
-    without a value for num_retries, it will be set from the underlying
-    instance or class' num_retries attribute.
+    `num_retries` keyword argument, with a `None` default.  When the method
+    is called without a value for `num_retries`, this decorator will set it
+    from the `num_retries` attribute of the underlying instance or class.
+
+    Arguments:
+
+    orig_func: Callable
+    : A class or instance method that accepts a `num_retries` keyword argument
      """
      @functools.wraps(orig_func)
      def num_retries_setter(self, *args, **kwargs):
diff --git a/sdk/python/setup.py b/sdk/python/setup.py

index d28df099879c907e5bd0bc5bd5498a4ae71fc2a1..1daafc97adcf89e2f6fac2f1899db2003967f25c 100644 (file)
--- a/sdk/python/setup.py
+++ b/sdk/python/setup.py
@@ -48,19 +48,22 @@ setup(name='arvados-python-client',
        install_requires=[
            'ciso8601 >=2.0.0',
            'future',
+          'google-api-core <2.11.0', # 2.11.0rc1 is incompatible with google-auth<2
            'google-api-python-client >=1.6.2, <2',
            'google-auth<2',
            'httplib2 >=0.9.2, <0.20.2',
            'pycurl >=7.19.5.1, <7.45.0',
-          'ruamel.yaml >=0.15.54, <0.17.11',
+          'ruamel.yaml >=0.15.54, <0.17.22',
            'setuptools',
            'ws4py >=0.4.2',
-          'protobuf<4.0.0dev'
+          'protobuf<4.0.0dev',
+          'pyparsing<3',
+          'setuptools>=40.3.0',
        ],
        classifiers=[
            'Programming Language :: Python :: 3',
        ],
        test_suite='tests',
-      tests_require=['pbr<1.7.0', 'mock>=1.0,<4', 'PyYAML'],
+      tests_require=['pbr<1.7.0', 'mock>=1.0,<4', 'PyYAML', 'parameterized'],
        zip_safe=False
        )
diff --git a/sdk/python/tests/arvados_testutil.py b/sdk/python/tests/arvados_testutil.py

index d9b3ca86c4f9055dde2fa9b54ad63ed65d16d755..00356597965fb09e61c12b84781475aa681aa46e 100644 (file)
--- a/sdk/python/tests/arvados_testutil.py
+++ b/sdk/python/tests/arvados_testutil.py
@@ -280,3 +280,30 @@ if sys.version_info < (3, 0):
          return self.assertNotRegexpMatches(*args, **kwargs)
      unittest.TestCase.assertRegex = assertRegex
      unittest.TestCase.assertNotRegex = assertNotRegex
+
+def binary_compare(a, b):
+    if len(a) != len(b):
+        return False
+    for i in range(0, len(a)):
+        if a[i] != b[i]:
+            return False
+    return True
+
+def make_block_cache(disk_cache):
+    if disk_cache:
+        disk_cache_dir = os.path.join(os.path.expanduser("~"), ".cache", "arvados", "keep")
+        shutil.rmtree(disk_cache_dir, ignore_errors=True)
+    block_cache = arvados.keep.KeepBlockCache(disk_cache=disk_cache)
+    return block_cache
+
+
+class DiskCacheBase:
+    def make_block_cache(self, disk_cache):
+        self.disk_cache_dir = tempfile.mkdtemp() if disk_cache else None
+        block_cache = arvados.keep.KeepBlockCache(disk_cache=disk_cache,
+                                                  disk_cache_dir=self.disk_cache_dir)
+        return block_cache
+
+    def tearDown(self):
+        if self.disk_cache_dir:
+            shutil.rmtree(self.disk_cache_dir)
diff --git a/sdk/python/tests/run_test_server.py b/sdk/python/tests/run_test_server.py

index e5d1d8fa380fb49513452d7555618c5410993764..2bb20ca5daec35fe5348369522a106a249959cfe 100644 (file)
--- a/sdk/python/tests/run_test_server.py
+++ b/sdk/python/tests/run_test_server.py
@@ -833,6 +833,9 @@ def setup_config():
                          "GitInternalDir": os.path.join(SERVICES_SRC_DIR, 'api', 'tmp', 'internal.git'),
                      },
                      "LocalKeepBlobBuffersPerVCPU": 0,
+                    "Logging": {
+                        "SweepInterval": 0, # disable, otherwise test cases can't acquire dblock
+                    },
                      "SupportedDockerImageFormats": {"v1": {}},
                      "ShellAccess": {
                          "Admin": True,
diff --git a/sdk/python/tests/test_collections.py b/sdk/python/tests/test_collections.py

index b4849c21ff30909ab3c7f9bb0af8040582e82a58..8986cf225840054bc5cd4161f7edd0b2c3f58b32 100644 (file)
--- a/sdk/python/tests/test_collections.py
+++ b/sdk/python/tests/test_collections.py
@@ -16,11 +16,13 @@ import datetime
  import ciso8601
  import time
  import unittest
+import parameterized
  
  from . import run_test_server
  from arvados._ranges import Range, LocatorAndRange
  from arvados.collection import Collection, CollectionReader
  from . import arvados_testutil as tutil
+from .arvados_testutil import make_block_cache
  
  class TestResumableWriter(arvados.ResumableCollectionWriter):
      KEEP_BLOCK_SIZE = 1024  # PUT to Keep every 1K.
@@ -28,9 +30,10 @@ class TestResumableWriter(arvados.ResumableCollectionWriter):
      def current_state(self):
          return self.dump_state(copy.deepcopy)
  
-
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
  class ArvadosCollectionsTest(run_test_server.TestCaseWithServers,
                               tutil.ArvadosBaseTestCase):
+    disk_cache = False
      MAIN_SERVER = {}
  
      @classmethod
@@ -40,7 +43,8 @@ class ArvadosCollectionsTest(run_test_server.TestCaseWithServers,
          run_test_server.authorize_with('admin')
          cls.api_client = arvados.api('v1')
          cls.keep_client = arvados.KeepClient(api_client=cls.api_client,
-                                             local_store=cls.local_store)
+                                             local_store=cls.local_store,
+                                             block_cache=make_block_cache(cls.disk_cache))
  
      def write_foo_bar_baz(self):
          cw = arvados.CollectionWriter(self.api_client)
@@ -896,7 +900,7 @@ class NewCollectionTestCase(unittest.TestCase, CollectionTestMixin):
          c1.save_new()
          loc = c1.manifest_locator()
          c2 = Collection(loc)
-        self.assertEqual(c1.manifest_text, c2.manifest_text)
+        self.assertEqual(c1.manifest_text(strip=True), c2.manifest_text(strip=True))
          self.assertEqual(c1.replication_desired, c2.replication_desired)
  
      def test_replication_desired_not_loaded_if_provided(self):
@@ -905,7 +909,7 @@ class NewCollectionTestCase(unittest.TestCase, CollectionTestMixin):
          c1.save_new()
          loc = c1.manifest_locator()
          c2 = Collection(loc, replication_desired=2)
-        self.assertEqual(c1.manifest_text, c2.manifest_text)
+        self.assertEqual(c1.manifest_text(strip=True), c2.manifest_text(strip=True))
          self.assertNotEqual(c1.replication_desired, c2.replication_desired)
  
      def test_storage_classes_desired_kept_on_load(self):
@@ -914,7 +918,7 @@ class NewCollectionTestCase(unittest.TestCase, CollectionTestMixin):
          c1.save_new()
          loc = c1.manifest_locator()
          c2 = Collection(loc)
-        self.assertEqual(c1.manifest_text, c2.manifest_text)
+        self.assertEqual(c1.manifest_text(strip=True), c2.manifest_text(strip=True))
          self.assertEqual(c1.storage_classes_desired(), c2.storage_classes_desired())
  
      def test_storage_classes_change_after_save(self):
@@ -927,7 +931,7 @@ class NewCollectionTestCase(unittest.TestCase, CollectionTestMixin):
          c2.save(storage_classes=['highIO'])
          self.assertEqual(['highIO'], c2.storage_classes_desired())
          c3 = Collection(loc)
-        self.assertEqual(c1.manifest_text, c3.manifest_text)
+        self.assertEqual(c1.manifest_text(strip=True), c3.manifest_text(strip=True))
          self.assertEqual(['highIO'], c3.storage_classes_desired())
  
      def test_storage_classes_desired_not_loaded_if_provided(self):
@@ -936,7 +940,7 @@ class NewCollectionTestCase(unittest.TestCase, CollectionTestMixin):
          c1.save_new()
          loc = c1.manifest_locator()
          c2 = Collection(loc, storage_classes_desired=['default'])
-        self.assertEqual(c1.manifest_text, c2.manifest_text)
+        self.assertEqual(c1.manifest_text(strip=True), c2.manifest_text(strip=True))
          self.assertNotEqual(c1.storage_classes_desired(), c2.storage_classes_desired())
  
      def test_init_manifest(self):
diff --git a/sdk/python/tests/test_keep_client.py b/sdk/python/tests/test_keep_client.py

index 87e4eefb29d666b4f3fa724151ba8cf268f7d20b..0fe396113644740b37dd2e4292c2a9d56c04605d 100644 (file)
--- a/sdk/python/tests/test_keep_client.py
+++ b/sdk/python/tests/test_keep_client.py
@@ -12,15 +12,21 @@ from builtins import object
  import hashlib
  import mock
  import os
+import errno
  import pycurl
  import random
  import re
+import shutil
  import socket
  import sys
+import stat
+import tempfile
  import time
  import unittest
  import urllib.parse
  
+import parameterized
+
  import arvados
  import arvados.retry
  import arvados.util
@@ -28,17 +34,29 @@ from . import arvados_testutil as tutil
  from . import keepstub
  from . import run_test_server
  
-class KeepTestCase(run_test_server.TestCaseWithServers):
+from .arvados_testutil import DiskCacheBase
+
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
+class KeepTestCase(run_test_server.TestCaseWithServers, DiskCacheBase):
+    disk_cache = False
      MAIN_SERVER = {}
      KEEP_SERVER = {}
+    block_cache_test = None
  
      @classmethod
      def setUpClass(cls):
          super(KeepTestCase, cls).setUpClass()
          run_test_server.authorize_with("admin")
          cls.api_client = arvados.api('v1')
+        cls.block_cache_test = DiskCacheBase()
          cls.keep_client = arvados.KeepClient(api_client=cls.api_client,
-                                             proxy='', local_store='')
+                                             proxy='', local_store='',
+                                             block_cache=cls.block_cache_test.make_block_cache(cls.disk_cache))
+
+    @classmethod
+    def tearDownClass(cls):
+        super(KeepTestCase, cls).setUpClass()
+        cls.block_cache_test.tearDown()
  
      def test_KeepBasicRWTest(self):
          self.assertEqual(0, self.keep_client.upload_counter.get())
@@ -52,8 +70,8 @@ class KeepTestCase(run_test_server.TestCaseWithServers):
          self.assertEqual(6, self.keep_client.upload_counter.get())
  
          self.assertEqual(0, self.keep_client.download_counter.get())
-        self.assertEqual(self.keep_client.get(foo_locator),
-                         b'foo',
+        self.assertTrue(tutil.binary_compare(self.keep_client.get(foo_locator),
+                         b'foo'),
                           'wrong content from Keep.get(md5("foo"))')
          self.assertEqual(3, self.keep_client.download_counter.get())
  
@@ -128,13 +146,18 @@ class KeepTestCase(run_test_server.TestCaseWithServers):
                           b'test_head',
                           'wrong content from Keep.get for "test_head"')
  
-class KeepPermissionTestCase(run_test_server.TestCaseWithServers):
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
+class KeepPermissionTestCase(run_test_server.TestCaseWithServers, DiskCacheBase):
+    disk_cache = False
      MAIN_SERVER = {}
      KEEP_SERVER = {'blob_signing': True}
  
+    def tearDown(self):
+        DiskCacheBase.tearDown(self)
+
      def test_KeepBasicRWTest(self):
          run_test_server.authorize_with('active')
-        keep_client = arvados.KeepClient()
+        keep_client = arvados.KeepClient(block_cache=self.make_block_cache(self.disk_cache))
          foo_locator = keep_client.put('foo')
          self.assertRegex(
              foo_locator,
@@ -171,8 +194,9 @@ class KeepPermissionTestCase(run_test_server.TestCaseWithServers):
                            keep_client.get,
                            unsigned_bar_locator)
  
-
-class KeepProxyTestCase(run_test_server.TestCaseWithServers):
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
+class KeepProxyTestCase(run_test_server.TestCaseWithServers, DiskCacheBase):
+    disk_cache = False
      MAIN_SERVER = {}
      KEEP_SERVER = {}
      KEEP_PROXY_SERVER = {}
@@ -185,12 +209,13 @@ class KeepProxyTestCase(run_test_server.TestCaseWithServers):
  
      def tearDown(self):
          super(KeepProxyTestCase, self).tearDown()
+        DiskCacheBase.tearDown(self)
  
      def test_KeepProxyTest1(self):
          # Will use ARVADOS_KEEP_SERVICES environment variable that
          # is set by setUpClass().
          keep_client = arvados.KeepClient(api_client=self.api_client,
-                                         local_store='')
+                                         local_store='', block_cache=self.make_block_cache(self.disk_cache))
          baz_locator = keep_client.put('baz')
          self.assertRegex(
              baz_locator,
@@ -206,7 +231,8 @@ class KeepProxyTestCase(run_test_server.TestCaseWithServers):
          # existing proxy setting and setting multiple proxies
          arvados.config.settings()['ARVADOS_KEEP_SERVICES'] = 'http://10.0.0.1 https://foo.example.org:1234/'
          keep_client = arvados.KeepClient(api_client=self.api_client,
-                                         local_store='')
+                                         local_store='',
+                                         block_cache=self.make_block_cache(self.disk_cache))
          uris = [x['_service_root'] for x in keep_client._keep_services]
          self.assertEqual(uris, ['http://10.0.0.1/',
                                  'https://foo.example.org:1234/'])
@@ -215,12 +241,18 @@ class KeepProxyTestCase(run_test_server.TestCaseWithServers):
          arvados.config.settings()['ARVADOS_KEEP_SERVICES'] = 'bad.uri.org'
          with self.assertRaises(arvados.errors.ArgumentError):
              keep_client = arvados.KeepClient(api_client=self.api_client,
-                                             local_store='')
+                                             local_store='',
+                                             block_cache=self.make_block_cache(self.disk_cache))
  
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
+class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock, DiskCacheBase):
+    disk_cache = False
+
+    def tearDown(self):
+        DiskCacheBase.tearDown(self)
  
-class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock):
      def get_service_roots(self, api_client):
-        keep_client = arvados.KeepClient(api_client=api_client)
+        keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
          services = keep_client.weighted_service_roots(arvados.KeepLocator('0'*32))
          return [urllib.parse.urlparse(url) for url in sorted(services)]
  
@@ -239,7 +271,8 @@ class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock):
  
      def test_recognize_proxy_services_in_controller_response(self):
          keep_client = arvados.KeepClient(api_client=self.mock_keep_services(
-            service_type='proxy', service_host='localhost', service_port=9, count=1))
+            service_type='proxy', service_host='localhost', service_port=9, count=1),
+                                         block_cache=self.make_block_cache(self.disk_cache))
          try:
              # this will fail, but it ensures we get the service
              # discovery response
@@ -254,7 +287,7 @@ class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock):
  
          api_client.insecure = True
          with tutil.mock_keep_responses(b'foo', 200) as mock:
-            keep_client = arvados.KeepClient(api_client=api_client)
+            keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
              keep_client.get('acbd18db4cc2f85cedef654fccc4a4d8+3')
              self.assertEqual(
                  mock.responses[0].getopt(pycurl.SSL_VERIFYPEER),
@@ -265,7 +298,7 @@ class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock):
  
          api_client.insecure = False
          with tutil.mock_keep_responses(b'foo', 200) as mock:
-            keep_client = arvados.KeepClient(api_client=api_client)
+            keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
              keep_client.get('acbd18db4cc2f85cedef654fccc4a4d8+3')
              # getopt()==None here means we didn't change the
              # default. If we were using real pycurl instead of a mock,
@@ -286,7 +319,7 @@ class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock):
          headers = {'X-Keep-Locator':local_loc}
          with tutil.mock_keep_responses('', 200, **headers):
              # Check that the translated locator gets returned
-            keep_client = arvados.KeepClient(api_client=api_client)
+            keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
              self.assertEqual(local_loc, keep_client.refresh_signature(remote_loc))
              # Check that refresh_signature() uses the correct method and headers
              keep_client._get_or_head = mock.MagicMock()
@@ -305,7 +338,7 @@ class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock):
          api_client = self.mock_keep_services(count=1)
          force_timeout = socket.timeout("timed out")
          with tutil.mock_keep_responses(force_timeout, 0) as mock:
-            keep_client = arvados.KeepClient(api_client=api_client)
+            keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
              with self.assertRaises(arvados.errors.KeepReadError):
                  keep_client.get('ffffffffffffffffffffffffffffffff')
              self.assertEqual(
@@ -322,7 +355,7 @@ class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock):
          api_client = self.mock_keep_services(count=1)
          force_timeout = socket.timeout("timed out")
          with tutil.mock_keep_responses(force_timeout, 0) as mock:
-            keep_client = arvados.KeepClient(api_client=api_client)
+            keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
              with self.assertRaises(arvados.errors.KeepWriteError):
                  keep_client.put(b'foo')
              self.assertEqual(
@@ -339,7 +372,7 @@ class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock):
          api_client = self.mock_keep_services(count=1)
          force_timeout = socket.timeout("timed out")
          with tutil.mock_keep_responses(force_timeout, 0) as mock:
-            keep_client = arvados.KeepClient(api_client=api_client)
+            keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
              with self.assertRaises(arvados.errors.KeepReadError):
                  keep_client.head('ffffffffffffffffffffffffffffffff')
              self.assertEqual(
@@ -356,7 +389,7 @@ class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock):
          api_client = self.mock_keep_services(service_type='proxy', count=1)
          force_timeout = socket.timeout("timed out")
          with tutil.mock_keep_responses(force_timeout, 0) as mock:
-            keep_client = arvados.KeepClient(api_client=api_client)
+            keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
              with self.assertRaises(arvados.errors.KeepReadError):
                  keep_client.get('ffffffffffffffffffffffffffffffff')
              self.assertEqual(
@@ -373,7 +406,7 @@ class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock):
          api_client = self.mock_keep_services(service_type='proxy', count=1)
          force_timeout = socket.timeout("timed out")
          with tutil.mock_keep_responses(force_timeout, 0) as mock:
-            keep_client = arvados.KeepClient(api_client=api_client)
+            keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
              with self.assertRaises(arvados.errors.KeepReadError):
                  keep_client.head('ffffffffffffffffffffffffffffffff')
              self.assertEqual(
@@ -387,6 +420,7 @@ class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock):
                  None)
  
      def test_proxy_put_timeout(self):
+        self.disk_cache_dir = None
          api_client = self.mock_keep_services(service_type='proxy', count=1)
          force_timeout = socket.timeout("timed out")
          with tutil.mock_keep_responses(force_timeout, 0) as mock:
@@ -407,7 +441,7 @@ class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock):
          api_client = mock.MagicMock(name='api_client')
          api_client.keep_services().accessible().execute.side_effect = (
              arvados.errors.ApiError)
-        keep_client = arvados.KeepClient(api_client=api_client)
+        keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
          with self.assertRaises(exc_class) as err_check:
              getattr(keep_client, verb)('d41d8cd98f00b204e9800998ecf8427e+0')
          self.assertEqual(0, len(err_check.exception.request_errors()))
@@ -427,7 +461,7 @@ class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock):
              "retry error reporting test", 500, 500, 500, 500, 500, 500, 502, 502)
          with req_mock, tutil.skip_sleep, \
                  self.assertRaises(exc_class) as err_check:
-            keep_client = arvados.KeepClient(api_client=api_client)
+            keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
              getattr(keep_client, verb)('d41d8cd98f00b204e9800998ecf8427e+0',
                                         num_retries=3)
          self.assertEqual([502, 502], [
@@ -450,7 +484,7 @@ class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock):
          api_client = self.mock_keep_services(count=3)
          with tutil.mock_keep_responses(data_loc, 200, 500, 500) as req_mock, \
                  self.assertRaises(arvados.errors.KeepWriteError) as exc_check:
-            keep_client = arvados.KeepClient(api_client=api_client)
+            keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
              keep_client.put(data)
          self.assertEqual(2, len(exc_check.exception.request_errors()))
  
@@ -460,7 +494,7 @@ class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock):
          api_client = self.mock_keep_services(service_type='proxy', read_only=True, count=1)
          with tutil.mock_keep_responses(data_loc, 200, 500, 500) as req_mock, \
                  self.assertRaises(arvados.errors.KeepWriteError) as exc_check:
-          keep_client = arvados.KeepClient(api_client=api_client)
+          keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
            keep_client.put(data)
          self.assertEqual(True, ("no Keep services available" in str(exc_check.exception)))
          self.assertEqual(0, len(exc_check.exception.request_errors()))
@@ -469,7 +503,7 @@ class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock):
          body = b'oddball service get'
          api_client = self.mock_keep_services(service_type='fancynewblobstore')
          with tutil.mock_keep_responses(body, 200):
-            keep_client = arvados.KeepClient(api_client=api_client)
+            keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
              actual = keep_client.get(tutil.str_keep_locator(body))
          self.assertEqual(body, actual)
  
@@ -478,7 +512,7 @@ class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock):
          pdh = tutil.str_keep_locator(body)
          api_client = self.mock_keep_services(service_type='fancynewblobstore')
          with tutil.mock_keep_responses(pdh, 200):
-            keep_client = arvados.KeepClient(api_client=api_client)
+            keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
              actual = keep_client.put(body, copies=1)
          self.assertEqual(pdh, actual)
  
@@ -490,20 +524,25 @@ class KeepClientServiceTestCase(unittest.TestCase, tutil.ApiClientMock):
          headers = {'x-keep-replicas-stored': 3}
          with tutil.mock_keep_responses(pdh, 200, 418, 418, 418,
                                         **headers) as req_mock:
-            keep_client = arvados.KeepClient(api_client=api_client)
+            keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
              actual = keep_client.put(body, copies=2)
          self.assertEqual(pdh, actual)
          self.assertEqual(1, req_mock.call_count)
  
-
  @tutil.skip_sleep
-class KeepClientCacheTestCase(unittest.TestCase, tutil.ApiClientMock):
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
+class KeepClientCacheTestCase(unittest.TestCase, tutil.ApiClientMock, DiskCacheBase):
+    disk_cache = False
+
      def setUp(self):
          self.api_client = self.mock_keep_services(count=2)
-        self.keep_client = arvados.KeepClient(api_client=self.api_client)
+        self.keep_client = arvados.KeepClient(api_client=self.api_client, block_cache=self.make_block_cache(self.disk_cache))
          self.data = b'xyzzy'
          self.locator = '1271ed5ef305aadabc605b1609e24c52'
  
+    def tearDown(self):
+        DiskCacheBase.tearDown(self)
+
      @mock.patch('arvados.KeepClient.KeepService.get')
      def test_get_request_cache(self, get_mock):
          with tutil.mock_keep_responses(self.data, 200, 200):
@@ -524,22 +563,31 @@ class KeepClientCacheTestCase(unittest.TestCase, tutil.ApiClientMock):
      def test_head_and_then_get_return_different_responses(self, get_mock):
          head_resp = None
          get_resp = None
-        get_mock.side_effect = ['first response', 'second response']
+        get_mock.side_effect = [b'first response', b'second response']
          with tutil.mock_keep_responses(self.data, 200, 200):
              head_resp = self.keep_client.head(self.locator)
              get_resp = self.keep_client.get(self.locator)
-        self.assertEqual('first response', head_resp)
+        self.assertEqual(b'first response', head_resp)
          # First reponse was not cached because it was from a HEAD request.
          self.assertNotEqual(head_resp, get_resp)
  
+
+
+
  @tutil.skip_sleep
-class KeepStorageClassesTestCase(unittest.TestCase, tutil.ApiClientMock):
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
+class KeepStorageClassesTestCase(unittest.TestCase, tutil.ApiClientMock, DiskCacheBase):
+    disk_cache = False
+
      def setUp(self):
          self.api_client = self.mock_keep_services(count=2)
-        self.keep_client = arvados.KeepClient(api_client=self.api_client)
+        self.keep_client = arvados.KeepClient(api_client=self.api_client, block_cache=self.make_block_cache(self.disk_cache))
          self.data = b'xyzzy'
          self.locator = '1271ed5ef305aadabc605b1609e24c52'
  
+    def tearDown(self):
+        DiskCacheBase.tearDown(self)
+
      def test_multiple_default_storage_classes_req_header(self):
          api_mock = self.api_client_mock()
          api_mock.config.return_value = {
@@ -550,7 +598,7 @@ class KeepStorageClassesTestCase(unittest.TestCase, tutil.ApiClientMock):
              }
          }
          api_client = self.mock_keep_services(api_mock=api_mock, count=2)
-        keep_client = arvados.KeepClient(api_client=api_client)
+        keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
          resp_hdr = {
              'x-keep-storage-classes-confirmed': 'foo=1, bar=1',
              'x-keep-replicas-stored': 1
@@ -644,10 +692,13 @@ class KeepStorageClassesTestCase(unittest.TestCase, tutil.ApiClientMock):
                      self.keep_client.put(self.data, copies=w_copies, classes=w_classes)
  
  @tutil.skip_sleep
-class KeepXRequestIdTestCase(unittest.TestCase, tutil.ApiClientMock):
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
+class KeepXRequestIdTestCase(unittest.TestCase, tutil.ApiClientMock, DiskCacheBase):
+    disk_cache = False
+
      def setUp(self):
          self.api_client = self.mock_keep_services(count=2)
-        self.keep_client = arvados.KeepClient(api_client=self.api_client)
+        self.keep_client = arvados.KeepClient(api_client=self.api_client, block_cache=self.make_block_cache(self.disk_cache))
          self.data = b'xyzzy'
          self.locator = '1271ed5ef305aadabc605b1609e24c52'
          self.test_id = arvados.util.new_request_id()
@@ -657,6 +708,9 @@ class KeepXRequestIdTestCase(unittest.TestCase, tutil.ApiClientMock):
          # id='123456789'>:
          self.api_client.request_id = None
  
+    def tearDown(self):
+        DiskCacheBase.tearDown(self)
+
      def test_default_to_api_client_request_id(self):
          self.api_client.request_id = self.test_id
          with tutil.mock_keep_responses(self.locator, 200, 200) as mock:
@@ -732,7 +786,9 @@ class KeepXRequestIdTestCase(unittest.TestCase, tutil.ApiClientMock):
  
  
  @tutil.skip_sleep
-class KeepClientRendezvousTestCase(unittest.TestCase, tutil.ApiClientMock):
+#@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
+class KeepClientRendezvousTestCase(unittest.TestCase, tutil.ApiClientMock, DiskCacheBase):
+    disk_cache = False
  
      def setUp(self):
          # expected_order[i] is the probe order for
@@ -755,7 +811,10 @@ class KeepClientRendezvousTestCase(unittest.TestCase, tutil.ApiClientMock):
              hashlib.md5(self.blocks[x]).hexdigest()
              for x in range(len(self.expected_order))]
          self.api_client = self.mock_keep_services(count=self.services)
-        self.keep_client = arvados.KeepClient(api_client=self.api_client)
+        self.keep_client = arvados.KeepClient(api_client=self.api_client, block_cache=self.make_block_cache(self.disk_cache))
+
+    def tearDown(self):
+        DiskCacheBase.tearDown(self)
  
      def test_weighted_service_roots_against_reference_set(self):
          # Confirm weighted_service_roots() returns the correct order
@@ -828,12 +887,12 @@ class KeepClientRendezvousTestCase(unittest.TestCase, tutil.ApiClientMock):
              hashlib.md5("{:064x}".format(x).encode()).hexdigest() for x in range(100)]
          initial_services = 12
          self.api_client = self.mock_keep_services(count=initial_services)
-        self.keep_client = arvados.KeepClient(api_client=self.api_client)
+        self.keep_client = arvados.KeepClient(api_client=self.api_client, block_cache=self.make_block_cache(self.disk_cache))
          probes_before = [
              self.keep_client.weighted_service_roots(arvados.KeepLocator(hash)) for hash in hashes]
          for added_services in range(1, 12):
              api_client = self.mock_keep_services(count=initial_services+added_services)
-            keep_client = arvados.KeepClient(api_client=api_client)
+            keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
              total_penalty = 0
              for hash_index in range(len(hashes)):
                  probe_after = keep_client.weighted_service_roots(
@@ -869,7 +928,7 @@ class KeepClientRendezvousTestCase(unittest.TestCase, tutil.ApiClientMock):
          # Arbitrary port number:
          aport = random.randint(1024,65535)
          api_client = self.mock_keep_services(service_port=aport, count=self.services)
-        keep_client = arvados.KeepClient(api_client=api_client)
+        keep_client = arvados.KeepClient(api_client=api_client, block_cache=self.make_block_cache(self.disk_cache))
          with mock.patch('pycurl.Curl') as curl_mock, \
               self.assertRaises(exc_class) as err_check:
              curl_mock.return_value = tutil.FakeCurl.make(code=500, body=b'')
@@ -885,8 +944,10 @@ class KeepClientRendezvousTestCase(unittest.TestCase, tutil.ApiClientMock):
      def test_put_error_shows_probe_order(self):
          self.check_64_zeros_error_order('put', arvados.errors.KeepWriteError)
  
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
+class KeepClientTimeout(keepstub.StubKeepServers, unittest.TestCase, DiskCacheBase):
+    disk_cache = False
  
-class KeepClientTimeout(keepstub.StubKeepServers, unittest.TestCase):
      # BANDWIDTH_LOW_LIM must be less than len(DATA) so we can transfer
      # 1s worth of data and then trigger bandwidth errors before running
      # out of data.
@@ -894,6 +955,9 @@ class KeepClientTimeout(keepstub.StubKeepServers, unittest.TestCase):
      BANDWIDTH_LOW_LIM = 1024
      TIMEOUT_TIME = 1.0
  
+    def tearDown(self):
+        DiskCacheBase.tearDown(self)
+
      class assertTakesBetween(unittest.TestCase):
          def __init__(self, tmin, tmax):
              self.tmin = tmin
@@ -923,7 +987,7 @@ class KeepClientTimeout(keepstub.StubKeepServers, unittest.TestCase):
      def keepClient(self, timeouts=(0.1, TIMEOUT_TIME, BANDWIDTH_LOW_LIM)):
          return arvados.KeepClient(
              api_client=self.api_client,
-            timeout=timeouts)
+            timeout=timeouts, block_cache=self.make_block_cache(self.disk_cache))
  
      def test_timeout_slow_connect(self):
          # Can't simulate TCP delays with our own socket. Leave our
@@ -1027,8 +1091,13 @@ class KeepClientTimeout(keepstub.StubKeepServers, unittest.TestCase):
              with self.assertRaises(arvados.errors.KeepWriteError):
                  kc.put(self.DATA, copies=1, num_retries=0)
  
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
+class KeepClientGatewayTestCase(unittest.TestCase, tutil.ApiClientMock, DiskCacheBase):
+    disk_cache = False
+
+    def tearDown(self):
+        DiskCacheBase.tearDown(self)
  
-class KeepClientGatewayTestCase(unittest.TestCase, tutil.ApiClientMock):
      def mock_disks_and_gateways(self, disks=3, gateways=1):
          self.gateways = [{
                  'uuid': 'zzzzz-bi6l4-gateway{:08d}'.format(i),
@@ -1043,7 +1112,7 @@ class KeepClientGatewayTestCase(unittest.TestCase, tutil.ApiClientMock):
              for gw in self.gateways]
          self.api_client = self.mock_keep_services(
              count=disks, additional_services=self.gateways)
-        self.keepClient = arvados.KeepClient(api_client=self.api_client)
+        self.keepClient = arvados.KeepClient(api_client=self.api_client, block_cache=self.make_block_cache(self.disk_cache))
  
      @mock.patch('pycurl.Curl')
      def test_get_with_gateway_hint_first(self, MockCurl):
@@ -1124,8 +1193,9 @@ class KeepClientGatewayTestCase(unittest.TestCase, tutil.ApiClientMock):
          self.assertEqual('https://keep.xyzzy.arvadosapi.com/'+locator,
                           MockCurl.return_value.getopt(pycurl.URL).decode())
  
-
  class KeepClientRetryTestMixin(object):
+    disk_cache = False
+
      # Testing with a local Keep store won't exercise the retry behavior.
      # Instead, our strategy is:
      # * Create a client with one proxy specified (pointed at a black
@@ -1150,6 +1220,7 @@ class KeepClientRetryTestMixin(object):
      def new_client(self, **caller_kwargs):
          kwargs = self.client_kwargs.copy()
          kwargs.update(caller_kwargs)
+        kwargs['block_cache'] = self.make_block_cache(self.disk_cache)
          return arvados.KeepClient(**kwargs)
  
      def run_method(self, *args, **kwargs):
@@ -1199,12 +1270,16 @@ class KeepClientRetryTestMixin(object):
  
  
  @tutil.skip_sleep
-class KeepClientRetryGetTestCase(KeepClientRetryTestMixin, unittest.TestCase):
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
+class KeepClientRetryGetTestCase(KeepClientRetryTestMixin, unittest.TestCase, DiskCacheBase):
      DEFAULT_EXPECT = KeepClientRetryTestMixin.TEST_DATA
      DEFAULT_EXCEPTION = arvados.errors.KeepReadError
      HINTED_LOCATOR = KeepClientRetryTestMixin.TEST_LOCATOR + '+K@xyzzy'
      TEST_PATCHER = staticmethod(tutil.mock_keep_responses)
  
+    def tearDown(self):
+        DiskCacheBase.tearDown(self)
+
      def run_method(self, locator=KeepClientRetryTestMixin.TEST_LOCATOR,
                     *args, **kwargs):
          return self.new_client().get(locator, *args, **kwargs)
@@ -1243,12 +1318,16 @@ class KeepClientRetryGetTestCase(KeepClientRetryTestMixin, unittest.TestCase):
              self.check_success(locator=self.HINTED_LOCATOR)
  
  @tutil.skip_sleep
-class KeepClientRetryHeadTestCase(KeepClientRetryTestMixin, unittest.TestCase):
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
+class KeepClientRetryHeadTestCase(KeepClientRetryTestMixin, unittest.TestCase, DiskCacheBase):
      DEFAULT_EXPECT = True
      DEFAULT_EXCEPTION = arvados.errors.KeepReadError
      HINTED_LOCATOR = KeepClientRetryTestMixin.TEST_LOCATOR + '+K@xyzzy'
      TEST_PATCHER = staticmethod(tutil.mock_keep_responses)
  
+    def tearDown(self):
+        DiskCacheBase.tearDown(self)
+
      def run_method(self, locator=KeepClientRetryTestMixin.TEST_LOCATOR,
                     *args, **kwargs):
          return self.new_client().head(locator, *args, **kwargs)
@@ -1281,11 +1360,15 @@ class KeepClientRetryHeadTestCase(KeepClientRetryTestMixin, unittest.TestCase):
              self.check_success(locator=self.HINTED_LOCATOR)
  
  @tutil.skip_sleep
-class KeepClientRetryPutTestCase(KeepClientRetryTestMixin, unittest.TestCase):
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
+class KeepClientRetryPutTestCase(KeepClientRetryTestMixin, unittest.TestCase, DiskCacheBase):
      DEFAULT_EXPECT = KeepClientRetryTestMixin.TEST_LOCATOR
      DEFAULT_EXCEPTION = arvados.errors.KeepWriteError
      TEST_PATCHER = staticmethod(tutil.mock_keep_responses)
  
+    def tearDown(self):
+        DiskCacheBase.tearDown(self)
+
      def run_method(self, data=KeepClientRetryTestMixin.TEST_DATA,
                     copies=1, *args, **kwargs):
          return self.new_client().put(data, copies, *args, **kwargs)
@@ -1369,13 +1452,19 @@ class AvoidOverreplication(unittest.TestCase, tutil.ApiClientMock):
  
  
  @tutil.skip_sleep
-class RetryNeedsMultipleServices(unittest.TestCase, tutil.ApiClientMock):
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
+class RetryNeedsMultipleServices(unittest.TestCase, tutil.ApiClientMock, DiskCacheBase):
+    disk_cache = False  # default read by setUp; parameterized_class overrides it per variant
+
      # Test put()s that need two distinct servers to succeed, possibly
      # requiring multiple passes through the retry loop.
  
      def setUp(self):
          self.api_client = self.mock_keep_services(count=2)
-        self.keep_client = arvados.KeepClient(api_client=self.api_client)
+        self.keep_client = arvados.KeepClient(api_client=self.api_client, block_cache=self.make_block_cache(self.disk_cache))
+
+    def tearDown(self):
+        DiskCacheBase.tearDown(self)
  
      def test_success_after_exception(self):
          with tutil.mock_keep_responses(
@@ -1402,7 +1491,13 @@ class RetryNeedsMultipleServices(unittest.TestCase, tutil.ApiClientMock):
                  self.keep_client.put('foo', num_retries=1, copies=2)
          self.assertEqual(2, req_mock.call_count)
  
-class KeepClientAPIErrorTest(unittest.TestCase):
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
+class KeepClientAPIErrorTest(unittest.TestCase, DiskCacheBase):
+    disk_cache = False
+
+    def tearDown(self):
+        DiskCacheBase.tearDown(self)
+
      def test_api_fail(self):
          class ApiMock(object):
              def __getattr__(self, r):
@@ -1415,7 +1510,8 @@ class KeepClientAPIErrorTest(unittest.TestCase):
                  else:
                      raise arvados.errors.KeepReadError()
          keep_client = arvados.KeepClient(api_client=ApiMock(),
-                                             proxy='', local_store='')
+                                         proxy='', local_store='',
+                                         block_cache=self.make_block_cache(self.disk_cache))
  
          # The bug this is testing for is that if an API (not
          # keepstore) exception is thrown as part of a get(), the next
@@ -1429,3 +1525,232 @@ class KeepClientAPIErrorTest(unittest.TestCase):
              keep_client.get("acbd18db4cc2f85cedef654fccc4a4d8+3")
          with self.assertRaises(arvados.errors.KeepReadError):
              keep_client.get("acbd18db4cc2f85cedef654fccc4a4d8+3")
+
+
+class KeepDiskCacheTestCase(unittest.TestCase, tutil.ApiClientMock):
+    def setUp(self):
+        self.api_client = self.mock_keep_services(count=2)
+        self.data = b'xyzzy'
+        self.locator = '1271ed5ef305aadabc605b1609e24c52'
+        self.disk_cache_dir = tempfile.mkdtemp()
+
+    def tearDown(self):
+        shutil.rmtree(self.disk_cache_dir)
+
+
+    @mock.patch('arvados.KeepClient.KeepService.get')
+    def test_disk_cache_read(self, get_mock):
+        # confirm it finds an existing cache block when the cache is
+        # initialized.
+
+        os.makedirs(os.path.join(self.disk_cache_dir, self.locator[0:3]))
+        with open(os.path.join(self.disk_cache_dir, self.locator[0:3], self.locator+".keepcacheblock"), "wb") as f:
+            f.write(self.data)
+
+        # block cache should have found the existing block
+        block_cache = arvados.keep.KeepBlockCache(disk_cache=True,
+                                                  disk_cache_dir=self.disk_cache_dir)
+        keep_client = arvados.KeepClient(api_client=self.api_client, block_cache=block_cache)
+
+        self.assertTrue(tutil.binary_compare(keep_client.get(self.locator), self.data))
+
+        get_mock.assert_not_called()
+
+
+    @mock.patch('arvados.KeepClient.KeepService.get')
+    def test_disk_cache_share(self, get_mock):
+        # confirm it finds a cache block written after the disk cache
+        # was initialized.
+
+        block_cache = arvados.keep.KeepBlockCache(disk_cache=True,
+                                                  disk_cache_dir=self.disk_cache_dir)
+        keep_client = arvados.KeepClient(api_client=self.api_client, block_cache=block_cache)
+
+        os.makedirs(os.path.join(self.disk_cache_dir, self.locator[0:3]))
+        with open(os.path.join(self.disk_cache_dir, self.locator[0:3], self.locator+".keepcacheblock"), "wb") as f:
+            f.write(self.data)
+
+        # when we try to get the block, it'll check the disk and find it.
+        self.assertTrue(tutil.binary_compare(keep_client.get(self.locator), self.data))
+
+        get_mock.assert_not_called()
+
+
+    def test_disk_cache_write(self):
+        # confirm the cache block was created
+
+        block_cache = arvados.keep.KeepBlockCache(disk_cache=True,
+                                                  disk_cache_dir=self.disk_cache_dir)
+        keep_client = arvados.KeepClient(api_client=self.api_client, block_cache=block_cache)
+
+        with tutil.mock_keep_responses(self.data, 200) as mock:
+            self.assertTrue(tutil.binary_compare(keep_client.get(self.locator), self.data))
+
+        self.assertIsNotNone(keep_client.get_from_cache(self.locator))
+
+        with open(os.path.join(self.disk_cache_dir, self.locator[0:3], self.locator+".keepcacheblock"), "rb") as f:
+            self.assertTrue(tutil.binary_compare(f.read(), self.data))
+
+
+    def test_disk_cache_clean(self):
+        # confirm that a tmp file in the cache is cleaned up
+
+        os.makedirs(os.path.join(self.disk_cache_dir, self.locator[0:3]))
+        with open(os.path.join(self.disk_cache_dir, self.locator[0:3], "tmpXYZABC.keepcacheblock"), "wb") as f:
+            f.write(b"abc1")
+
+        with open(os.path.join(self.disk_cache_dir, self.locator[0:3], "tmpXYZABC"), "wb") as f:
+            f.write(b"abc2")
+
+        with open(os.path.join(self.disk_cache_dir, self.locator[0:3], "XYZABC"), "wb") as f:
+            f.write(b"abc3")
+
+        self.assertTrue(os.path.exists(os.path.join(self.disk_cache_dir, self.locator[0:3], "tmpXYZABC.keepcacheblock")))
+        self.assertTrue(os.path.exists(os.path.join(self.disk_cache_dir, self.locator[0:3], "tmpXYZABC")))
+        self.assertTrue(os.path.exists(os.path.join(self.disk_cache_dir, self.locator[0:3], "XYZABC")))
+
+        block_cache = arvados.keep.KeepBlockCache(disk_cache=True,
+                                                  disk_cache_dir=self.disk_cache_dir)
+
+        # The tmp still hasn't been deleted because it was created in the last 60 seconds
+        self.assertTrue(os.path.exists(os.path.join(self.disk_cache_dir, self.locator[0:3], "tmpXYZABC.keepcacheblock")))
+        self.assertTrue(os.path.exists(os.path.join(self.disk_cache_dir, self.locator[0:3], "tmpXYZABC")))
+        self.assertTrue(os.path.exists(os.path.join(self.disk_cache_dir, self.locator[0:3], "XYZABC")))
+
+        # Set the mtime to 61s in the past
+        os.utime(os.path.join(self.disk_cache_dir, self.locator[0:3], "tmpXYZABC.keepcacheblock"), times=(time.time()-61, time.time()-61))
+        os.utime(os.path.join(self.disk_cache_dir, self.locator[0:3], "tmpXYZABC"), times=(time.time()-61, time.time()-61))
+        os.utime(os.path.join(self.disk_cache_dir, self.locator[0:3], "XYZABC"), times=(time.time()-61, time.time()-61))
+
+        block_cache2 = arvados.keep.KeepBlockCache(disk_cache=True,
+                                                   disk_cache_dir=self.disk_cache_dir)
+
+        # Tmp should be gone but the other ones are safe.
+        self.assertFalse(os.path.exists(os.path.join(self.disk_cache_dir, self.locator[0:3], "tmpXYZABC.keepcacheblock")))
+        self.assertTrue(os.path.exists(os.path.join(self.disk_cache_dir, self.locator[0:3], "tmpXYZABC")))
+        self.assertTrue(os.path.exists(os.path.join(self.disk_cache_dir, self.locator[0:3], "XYZABC")))
+
+
+    @mock.patch('arvados.KeepClient.KeepService.get')
+    def test_disk_cache_cap(self, get_mock):
+        # confirm that the cache is kept to the desired limit
+
+        os.makedirs(os.path.join(self.disk_cache_dir, self.locator[0:3]))
+        with open(os.path.join(self.disk_cache_dir, self.locator[0:3], self.locator+".keepcacheblock"), "wb") as f:
+            f.write(self.data)
+
+        os.makedirs(os.path.join(self.disk_cache_dir, "acb"))
+        with open(os.path.join(self.disk_cache_dir, "acb", "acbd18db4cc2f85cedef654fccc4a4d8.keepcacheblock"), "wb") as f:
+            f.write(b"foo")
+
+        self.assertTrue(os.path.exists(os.path.join(self.disk_cache_dir, self.locator[0:3], self.locator+".keepcacheblock")))
+        self.assertTrue(os.path.exists(os.path.join(self.disk_cache_dir, "acb", "acbd18db4cc2f85cedef654fccc4a4d8.keepcacheblock")))
+
+        block_cache = arvados.keep.KeepBlockCache(disk_cache=True,
+                                                   disk_cache_dir=self.disk_cache_dir,
+                                                   max_slots=1)
+
+        self.assertFalse(os.path.exists(os.path.join(self.disk_cache_dir, self.locator[0:3], self.locator+".keepcacheblock")))
+        self.assertTrue(os.path.exists(os.path.join(self.disk_cache_dir, "acb", "acbd18db4cc2f85cedef654fccc4a4d8.keepcacheblock")))
+
+
+    @mock.patch('arvados.KeepClient.KeepService.get')
+    def test_disk_cache_share_preserves_files(self, get_mock):
+        # confirm that a second, smaller cache opened on the same directory doesn't delete files that belong to the first cache.
+
+        os.makedirs(os.path.join(self.disk_cache_dir, self.locator[0:3]))
+        with open(os.path.join(self.disk_cache_dir, self.locator[0:3], self.locator+".keepcacheblock"), "wb") as f:
+            f.write(self.data)
+
+        os.makedirs(os.path.join(self.disk_cache_dir, "acb"))
+        with open(os.path.join(self.disk_cache_dir, "acb", "acbd18db4cc2f85cedef654fccc4a4d8.keepcacheblock"), "wb") as f:
+            f.write(b"foo")
+
+        self.assertTrue(os.path.exists(os.path.join(self.disk_cache_dir, self.locator[0:3], self.locator+".keepcacheblock")))
+        self.assertTrue(os.path.exists(os.path.join(self.disk_cache_dir, "acb", "acbd18db4cc2f85cedef654fccc4a4d8.keepcacheblock")))
+
+        block_cache = arvados.keep.KeepBlockCache(disk_cache=True,
+                                                  disk_cache_dir=self.disk_cache_dir,
+                                                  max_slots=2)
+
+        self.assertTrue(os.path.exists(os.path.join(self.disk_cache_dir, self.locator[0:3], self.locator+".keepcacheblock")))
+        self.assertTrue(os.path.exists(os.path.join(self.disk_cache_dir, "acb", "acbd18db4cc2f85cedef654fccc4a4d8.keepcacheblock")))
+
+        block_cache2 = arvados.keep.KeepBlockCache(disk_cache=True,
+                                                   disk_cache_dir=self.disk_cache_dir,
+                                                   max_slots=1)
+
+        self.assertTrue(os.path.exists(os.path.join(self.disk_cache_dir, self.locator[0:3], self.locator+".keepcacheblock")))
+        self.assertTrue(os.path.exists(os.path.join(self.disk_cache_dir, "acb", "acbd18db4cc2f85cedef654fccc4a4d8.keepcacheblock")))
+
+
+
+    def test_disk_cache_error(self):
+        os.chmod(self.disk_cache_dir, stat.S_IRUSR)
+
+        # Fail during cache initialization.
+        with self.assertRaises(OSError):
+            block_cache = arvados.keep.KeepBlockCache(disk_cache=True,
+                                                      disk_cache_dir=self.disk_cache_dir)
+
+
+    def test_disk_cache_write_error(self):
+        block_cache = arvados.keep.KeepBlockCache(disk_cache=True,
+                                                  disk_cache_dir=self.disk_cache_dir)
+
+        keep_client = arvados.KeepClient(api_client=self.api_client, block_cache=block_cache)
+
+        # Make the cache dir read-only
+        os.makedirs(os.path.join(self.disk_cache_dir, self.locator[0:3]))
+        os.chmod(os.path.join(self.disk_cache_dir, self.locator[0:3]), stat.S_IRUSR)
+
+        # Cache fails
+        with self.assertRaises(arvados.errors.KeepCacheError):
+            with tutil.mock_keep_responses(self.data, 200) as mock:
+                keep_client.get(self.locator)
+
+
+    @mock.patch('mmap.mmap')
+    def test_disk_cache_retry_write_error(self, mockmmap):
+        block_cache = arvados.keep.KeepBlockCache(disk_cache=True,
+                                                  disk_cache_dir=self.disk_cache_dir)
+
+        keep_client = arvados.KeepClient(api_client=self.api_client, block_cache=block_cache)
+
+        mockmmap.side_effect = (OSError(errno.ENOSPC, "no space"), self.data)
+
+        cache_max_before = block_cache.cache_max
+
+        with tutil.mock_keep_responses(self.data, 200) as mock:
+            self.assertTrue(tutil.binary_compare(keep_client.get(self.locator), self.data))
+
+        self.assertIsNotNone(keep_client.get_from_cache(self.locator))
+
+        with open(os.path.join(self.disk_cache_dir, self.locator[0:3], self.locator+".keepcacheblock"), "rb") as f:
+            self.assertTrue(tutil.binary_compare(f.read(), self.data))
+
+        # shrank the cache in response to ENOSPC
+        self.assertTrue(cache_max_before > block_cache.cache_max)
+
+
+    @mock.patch('mmap.mmap')
+    def test_disk_cache_retry_write_error2(self, mockmmap):
+        block_cache = arvados.keep.KeepBlockCache(disk_cache=True,
+                                                  disk_cache_dir=self.disk_cache_dir)
+
+        keep_client = arvados.KeepClient(api_client=self.api_client, block_cache=block_cache)
+
+        mockmmap.side_effect = (OSError(errno.ENOMEM, "no memory"), self.data)
+
+        slots_before = block_cache._max_slots
+
+        with tutil.mock_keep_responses(self.data, 200) as mock:
+            self.assertTrue(tutil.binary_compare(keep_client.get(self.locator), self.data))
+
+        self.assertIsNotNone(keep_client.get_from_cache(self.locator))
+
+        with open(os.path.join(self.disk_cache_dir, self.locator[0:3], self.locator+".keepcacheblock"), "rb") as f:
+            self.assertTrue(tutil.binary_compare(f.read(), self.data))
+
+        # shrank the cache in response to ENOMEM
+        self.assertTrue(slots_before > block_cache._max_slots)
diff --git a/sdk/ruby/lib/arvados.rb b/sdk/ruby/lib/arvados.rb

index a72a9f8241f442f20d6c7559baedeb79582cc218..7b99ba5788943581b4c0a2da469ebd60f32a1c03 100644 (file)
--- a/sdk/ruby/lib/arvados.rb
+++ b/sdk/ruby/lib/arvados.rb
@@ -7,6 +7,7 @@ require 'active_support/inflector'
  require 'json'
  require 'fileutils'
  require 'andand'
+require 'net/http'
  
  require 'arvados/google_api_client'
  
@@ -188,6 +189,15 @@ class Arvados
      @config = config
    end
  
+  def cluster_config
+    return @cluster_config if @cluster_config
+
+    uri = URI("https://#{config()["ARVADOS_API_HOST"]}/arvados/v1/config")
+    cc = JSON.parse(Net::HTTP.get(uri))
+
+    @cluster_config = cc
+  end
+
    class Model
      def self.arvados_api
        arvados.arvados_api
diff --git a/sdk/ruby/lib/arvados/keep.rb b/sdk/ruby/lib/arvados/keep.rb

index 458af53a748834f6f0eb22942b07c16a6187e029..e391b7a6ca027aacad81a38d85ef7ddd05133c43 100644 (file)
--- a/sdk/ruby/lib/arvados/keep.rb
+++ b/sdk/ruby/lib/arvados/keep.rb
@@ -248,7 +248,7 @@ module Keep
      end
  
      # Verify that a given manifest is valid according to
-    # https://arvados.org/projects/arvados/wiki/Keep_manifest_format
+    # https://dev.arvados.org/projects/arvados/wiki/Keep_manifest_format
      def self.validate! manifest
        raise ArgumentError.new "No manifest found" if !manifest
  
diff --git a/services/api/Gemfile.lock b/services/api/Gemfile.lock

index 6bc53be4f886286103023537dd3b335fae8f34b1..811aa0cc2e06d9f3e80718db8e21d6e2199f32fa 100644 (file)
--- a/services/api/Gemfile.lock
+++ b/services/api/Gemfile.lock
@@ -146,7 +146,7 @@ GEM
      oj (3.9.2)
      optimist (3.0.0)
      os (1.1.1)
-    passenger (6.0.2)
+    passenger (6.0.15)
        rack
        rake (>= 0.8.1)
      pg (1.1.4)
diff --git a/services/api/app/models/api_client.rb b/services/api/app/models/api_client.rb

index c914051a349685aa5f73dc419a16a17449a4b2f5..55a4c6706c7ccb802f50bdd8a2c2fbe3cee4fdee 100644 (file)
--- a/services/api/app/models/api_client.rb
+++ b/services/api/app/models/api_client.rb
@@ -43,11 +43,10 @@ class ApiClient < ArvadosModel
    def norm url
      # normalize URL for comparison
      url = URI(url.to_s)
-    if url.scheme == "https"
-      url.port == "443"
-    end
-    if url.scheme == "http"
-      url.port == "80"
+    if url.scheme == "https" && url.port == ""
+      url.port = "443"
+    elsif url.scheme == "http" && url.port == ""
+      url.port = "80"
      end
      url.path = "/"
      url
diff --git a/services/api/app/models/arvados_model.rb b/services/api/app/models/arvados_model.rb

index c2725506c02ef75a85dee2a7c3a11fbd8db7e119..1ff46c3616975f4d90e23b5ef4603facd1ccc217 100644 (file)
--- a/services/api/app/models/arvados_model.rb
+++ b/services/api/app/models/arvados_model.rb
@@ -478,12 +478,11 @@ class ArvadosModel < ApplicationRecord
        conn.exec_query 'SAVEPOINT save_with_unique_name'
        begin
          save!
+        conn.exec_query 'RELEASE SAVEPOINT save_with_unique_name'
        rescue ActiveRecord::RecordNotUnique => rn
          raise if max_retries == 0
          max_retries -= 1
  
-        conn.exec_query 'ROLLBACK TO SAVEPOINT save_with_unique_name'
-
          # Dig into the error to determine if it is specifically calling out a
          # (owner_uuid, name) uniqueness violation.  In this specific case, and
          # the client requested a unique name with ensure_unique_name==true,
@@ -501,6 +500,8 @@ class ArvadosModel < ApplicationRecord
          detail = err.result.error_field(PG::Result::PG_DIAG_MESSAGE_DETAIL)
          raise unless /^Key \(owner_uuid, name\)=\([a-z0-9]{5}-[a-z0-9]{5}-[a-z0-9]{15}, .*?\) already exists\./.match detail
  
+        conn.exec_query 'ROLLBACK TO SAVEPOINT save_with_unique_name'
+
          new_name = "#{name_was} (#{db_current_time.utc.iso8601(3)})"
          if new_name == name
            # If the database is fast enough to do two attempts in the
@@ -518,10 +519,8 @@ class ArvadosModel < ApplicationRecord
              self[:current_version_uuid] = nil
            end
          end
-        conn.exec_query 'SAVEPOINT save_with_unique_name'
+
          retry
-      ensure
-        conn.exec_query 'RELEASE SAVEPOINT save_with_unique_name'
        end
      end
    end
@@ -951,6 +950,10 @@ class ArvadosModel < ApplicationRecord
    # value in the database to an implicit zero/false value in an update
    # request.
    def fill_container_defaults
+    # Keep this hash sorted by key. Values from the database are
+    # merged on top of it, so the key order defined here -- not the
+    # order in which the keys appear in the database -- is the order
+    # that gets used downstream.
      self.runtime_constraints = {
        'API' => false,
        'cuda' => {
@@ -958,6 +961,7 @@ class ArvadosModel < ApplicationRecord
          'driver_version' => '',
          'hardware_capability' => '',
        },
+      'keep_cache_disk' => 0,
        'keep_cache_ram' => 0,
        'ram' => 0,
        'vcpus' => 0,
diff --git a/services/api/app/models/container.rb b/services/api/app/models/container.rb

index 3e3f73b838dab5f4809bef12cd8c3d3dc1b02b08..4b02ad52e56dc55925d9418e528434917897379e 100644 (file)
--- a/services/api/app/models/container.rb
+++ b/services/api/app/models/container.rb
@@ -227,6 +227,10 @@ class Container < ArvadosModel
      if rc['keep_cache_ram'] == 0
        rc['keep_cache_ram'] = Rails.configuration.Containers.DefaultKeepCacheRAM
      end
+    if rc['keep_cache_disk'] == 0 and rc['keep_cache_ram'] == 0
+      # Only set if keep_cache_ram isn't set.
+      rc['keep_cache_disk'] = Rails.configuration.Containers.DefaultKeepCacheDisk
+    end
      rc
    end
  
@@ -306,6 +310,15 @@ class Container < ArvadosModel
        # records that don't have a 'cuda' section in runtime_constraints
        resolved_runtime_constraints << resolved_runtime_constraints[0].except('cuda')
      end
+    if resolved_runtime_constraints[0]['keep_cache_disk'] == 0
+      # If no disk cache requested, extend search to include older container
+      # records that don't have a 'keep_cache_disk' field in runtime_constraints
+      if resolved_runtime_constraints.length == 2
+        # exclude the one that also excludes CUDA
+        resolved_runtime_constraints << resolved_runtime_constraints[1].except('keep_cache_disk')
+      end
+      resolved_runtime_constraints << resolved_runtime_constraints[0].except('keep_cache_disk')
+    end
  
      candidates = candidates.where_serialized(:runtime_constraints, resolved_runtime_constraints, md5: true, multivalue: true)
      log_reuse_info(candidates) { "after filtering on runtime_constraints #{attrs[:runtime_constraints].inspect}" }
diff --git a/services/api/app/models/user.rb b/services/api/app/models/user.rb

index 8c8039f1b842a7fa1242f0a822d964800bdf3f29..bbdd9c2843d4d810439e1f9ecafce1b0835b02ae 100644 (file)
--- a/services/api/app/models/user.rb
+++ b/services/api/app/models/user.rb
@@ -308,25 +308,20 @@ SELECT target_uuid, perm_level
  
      # delete oid_login_perms for this user
      #
-    # note: these permission links are obsolete, they have no effect
-    # on anything and they are not created for new users.
+    # note: these permission links are obsolete anyway: they have no
+    # effect on anything and they are not created for new users.
      Link.where(tail_uuid: self.email,
                 link_class: 'permission',
                 name: 'can_login').destroy_all
  
-    # delete repo_perms for this user
-    Link.where(tail_uuid: self.uuid,
-               link_class: 'permission',
-               name: 'can_manage').destroy_all
-
-    # delete vm_login_perms for this user
-    Link.where(tail_uuid: self.uuid,
-               link_class: 'permission',
-               name: 'can_login').destroy_all
-
-    # delete "All users" group read permissions for this user
+    # Delete all sharing permissions so (a) the user doesn't
+    # automatically regain access to anything if re-setup in future,
+    # (b) the user doesn't appear in "currently shared with" lists
+    # shown to other users.
+    #
+    # Notably this includes the can_read -> "all users" group
+    # permission.
      Link.where(tail_uuid: self.uuid,
-               head_uuid: all_users_group_uuid,
                 link_class: 'permission').destroy_all
  
      # delete any signatures by this user
diff --git a/services/api/lib/tasks/delete_old_container_logs.rake b/services/api/lib/tasks/delete_old_container_logs.rake

index 7a0ab3826ab1c08beee1361ff81b654b4ccff86d..db1b3667cc0a94a95eebd51b46224daab3981336 100644 (file)
--- a/services/api/lib/tasks/delete_old_container_logs.rake
+++ b/services/api/lib/tasks/delete_old_container_logs.rake
@@ -8,11 +8,9 @@
  # from the logs table.
  
  namespace :db do
-  desc "Remove old container log entries from the logs table"
+  desc "deprecated / no-op"
  
    task delete_old_container_logs: :environment do
-    delete_sql = "DELETE FROM logs WHERE id in (SELECT logs.id FROM logs JOIN containers ON logs.object_uuid = containers.uuid WHERE event_type IN ('stdout', 'stderr', 'arv-mount', 'crunch-run', 'crunchstat') AND containers.log IS NOT NULL AND now() - containers.finished_at > interval '#{Rails.configuration.Containers.Logging.MaxAge.to_i} seconds')"
-
-    ActiveRecord::Base.connection.execute(delete_sql)
+    Rails.logger.info "this db:delete_old_container_logs rake task is no longer used"
    end
  end
diff --git a/services/api/test/fixtures/containers.yml b/services/api/test/fixtures/containers.yml

index a61fb07177bba1045aca1f949bcdaa9632efb1ff..73b17280bb28db534c7802b90b3df5061bd5b14a 100644 (file)
--- a/services/api/test/fixtures/containers.yml
+++ b/services/api/test/fixtures/containers.yml
@@ -170,6 +170,7 @@ diagnostics_completed_requester:
             ]
    runtime_constraints:
      API: true
+    keep_cache_disk: 0
      keep_cache_ram: 268435456
      ram: 1342177280
      vcpus: 1
@@ -195,6 +196,7 @@ diagnostics_completed_hasher1:
             ]
    runtime_constraints:
      API: true
+    keep_cache_disk: 0
      keep_cache_ram: 268435456
      ram: 268435456
      vcpus: 1
@@ -220,6 +222,7 @@ diagnostics_completed_hasher2:
             ]
    runtime_constraints:
      API: true
+    keep_cache_disk: 0
      keep_cache_ram: 268435456
      ram: 268435456
      vcpus: 2
@@ -245,6 +248,7 @@ diagnostics_completed_hasher3:
             ]
    runtime_constraints:
      API: true
+    keep_cache_disk: 0
      keep_cache_ram: 268435456
      ram: 268435456
      vcpus: 1
@@ -281,6 +285,7 @@ diagnostics_completed_requester2:
             ]
    runtime_constraints:
      API: true
+    keep_cache_disk: 0
      keep_cache_ram: 268435456
      ram: 1342177280
      vcpus: 1
diff --git a/services/api/test/functional/arvados/v1/collections_controller_test.rb b/services/api/test/functional/arvados/v1/collections_controller_test.rb

index af11715982a1adf26226a986c54bc9b6f69676c9..8a1d044d6a760fca9ec969114382eef77b71d2ef 100644 (file)
--- a/services/api/test/functional/arvados/v1/collections_controller_test.rb
+++ b/services/api/test/functional/arvados/v1/collections_controller_test.rb
@@ -374,6 +374,24 @@ EOS
             "Expected 'duplicate key' error in #{response_errors.first}")
    end
  
+  [false, true].each do |ensure_unique_name|
+    test "create failure with too-long name, ensure_unique_name #{ensure_unique_name}" do
+      authorize_with :active
+      post :create, params: {
+             collection: {
+               owner_uuid: users(:active).uuid,
+               manifest_text: "",
+               name: "this...............................................................................................................................................................................................................................................................name is too long"
+             },
+             ensure_unique_name: ensure_unique_name
+           }
+      assert_response 422
+      # check the real error isn't masked by an
+      # ensure_unique_name-related error (#19698)
+      assert_match(/value too long for type/, json_response['errors'][0])
+    end
+  end
+
    [false, true].each do |unsigned|
      test "create with duplicate name, ensure_unique_name, unsigned=#{unsigned}" do
        permit_unsigned_manifests unsigned
diff --git a/services/api/test/integration/users_test.rb b/services/api/test/integration/users_test.rb

index f7fddb44d371c727a0da1b9ef314004fe67f1d6d..ca143363892cad7065e65d704d1c76bbd7551c83 100644 (file)
--- a/services/api/test/integration/users_test.rb
+++ b/services/api/test/integration/users_test.rb
@@ -203,6 +203,22 @@ class UsersTest < ActionDispatch::IntegrationTest
        ApiClientAuthorization.create!(user: User.find_by_uuid(created['uuid']), api_client: ApiClient.all.first).api_token
      end
  
+    # share project and collections with the new user
+    act_as_system_user do
+      Link.create!(tail_uuid: created['uuid'],
+                   head_uuid: groups(:aproject).uuid,
+                   link_class: 'permission',
+                   name: 'can_manage')
+      Link.create!(tail_uuid: created['uuid'],
+                   head_uuid: collections(:collection_owned_by_active).uuid,
+                   link_class: 'permission',
+                   name: 'can_read')
+      Link.create!(tail_uuid: created['uuid'],
+                   head_uuid: collections(:collection_owned_by_active_with_file_stats).uuid,
+                   link_class: 'permission',
+                   name: 'can_write')
+    end
+
      assert_equal 1, ApiClientAuthorization.where(user_id: User.find_by_uuid(created['uuid']).id).size, 'expected token not found'
  
      post "/arvados/v1/users/#{created['uuid']}/unsetup", params: {}, headers: auth(:admin)
@@ -213,6 +229,8 @@ class UsersTest < ActionDispatch::IntegrationTest
      assert_not_nil created2['uuid'], 'expected uuid for the newly created user'
      assert_equal created['uuid'], created2['uuid'], 'expected uuid not found'
      assert_equal 0, ApiClientAuthorization.where(user_id: User.find_by_uuid(created['uuid']).id).size, 'token should have been deleted by user unsetup'
+    # check permissions are deleted
+    assert_empty Link.where(tail_uuid: created['uuid'])
  
      verify_link_existence created['uuid'], created['email'], false, false, false, false, false
    end
diff --git a/services/api/test/tasks/delete_old_container_logs_test.rb b/services/api/test/tasks/delete_old_container_logs_test.rb

deleted file mode 100644 (file)

index c81b331..0000000
--- a/services/api/test/tasks/delete_old_container_logs_test.rb
+++ /dev/null
@@ -1,54 +0,0 @@
-# Copyright (C) The Arvados Authors. All rights reserved.
-#
-# SPDX-License-Identifier: AGPL-3.0
-
-require 'test_helper'
-require 'rake'
-
-Rake.application.rake_require "tasks/delete_old_container_logs"
-Rake::Task.define_task(:environment)
-
-class DeleteOldContainerLogsTaskTest < ActiveSupport::TestCase
-  TASK_NAME = "db:delete_old_container_logs"
-
-  def log_uuids(*fixture_names)
-    fixture_names.map { |name| logs(name).uuid }
-  end
-
-  def run_with_expiry(clean_after)
-    Rails.configuration.Containers.Logging.MaxAge = clean_after
-    Rake::Task[TASK_NAME].reenable
-    Rake.application.invoke_task TASK_NAME
-  end
-
-  def check_log_existence(test_method, fixture_uuids)
-    uuids_now = Log.where("object_uuid LIKE :pattern AND event_type in ('stdout', 'stderr', 'arv-mount', 'crunch-run', 'crunchstat')", pattern: "%-dz642-%").map(&:uuid)
-    fixture_uuids.each do |expect_uuid|
-      send(test_method, uuids_now, expect_uuid)
-    end
-  end
-
-  test "delete all finished logs" do
-    uuids_to_keep = log_uuids(:stderr_for_running_container,
-                              :crunchstat_for_running_container)
-    uuids_to_clean = log_uuids(:stderr_for_previous_container,
-                               :crunchstat_for_previous_container,
-                               :stderr_for_ancient_container,
-                               :crunchstat_for_ancient_container)
-    run_with_expiry(1)
-    check_log_existence(:assert_includes, uuids_to_keep)
-    check_log_existence(:refute_includes, uuids_to_clean)
-  end
-
-  test "delete old finished logs" do
-    uuids_to_keep = log_uuids(:stderr_for_running_container,
-                              :crunchstat_for_running_container,
-                              :stderr_for_previous_container,
-                              :crunchstat_for_previous_container)
-    uuids_to_clean = log_uuids(:stderr_for_ancient_container,
-                               :crunchstat_for_ancient_container)
-    run_with_expiry(360.days)
-    check_log_existence(:assert_includes, uuids_to_keep)
-    check_log_existence(:refute_includes, uuids_to_clean)
-  end
-end
diff --git a/services/api/test/unit/container_request_test.rb b/services/api/test/unit/container_request_test.rb

index e6db412179b663e39696e9c884af584af287ddbf..efc61eee8c80fcfa509478ebc0ec51e947e3cccb 100644 (file)
--- a/services/api/test/unit/container_request_test.rb
+++ b/services/api/test/unit/container_request_test.rb
@@ -177,6 +177,9 @@ class ContainerRequestTest < ActiveSupport::TestCase
  
      assert ({"vcpus" => 2, "ram" => 30}.to_a - cr.runtime_constraints.to_a).empty?
  
+    assert_equal 0, Rails.configuration.Containers.DefaultKeepCacheRAM
+    assert_equal 8589934592, Rails.configuration.Containers.DefaultKeepCacheDisk
+
      assert_not_nil cr.container_uuid
      c = Container.find_by_uuid cr.container_uuid
      assert_not_nil c
@@ -186,7 +189,7 @@ class ContainerRequestTest < ActiveSupport::TestCase
      assert_equal({}, c.environment)
      assert_equal({"/out" => {"kind"=>"tmp", "capacity"=>1000000}}, c.mounts)
      assert_equal "/out", c.output_path
-    assert ({"keep_cache_ram"=>268435456, "vcpus" => 2, "ram" => 30}.to_a - c.runtime_constraints.to_a).empty?
+    assert ({"keep_cache_disk"=>8589934592, "keep_cache_ram"=>0, "vcpus" => 2, "ram" => 30}.to_a - c.runtime_constraints.to_a).empty?
      assert_operator 0, :<, c.priority
  
      assert_raises(ActiveRecord::RecordInvalid) do
diff --git a/services/api/test/unit/container_test.rb b/services/api/test/unit/container_test.rb

index a4c0ce17926092ec451583404a21f56374f79176..f804aca2d982fd8d000fcf10d19eec0d47173965 100644 (file)
--- a/services/api/test/unit/container_test.rb
+++ b/services/api/test/unit/container_test.rb
@@ -24,6 +24,7 @@ class ContainerTest < ActiveSupport::TestCase
      output_path: "test",
      runtime_constraints: {
        "API" => false,
+      "keep_cache_disk" => 0,
        "keep_cache_ram" => 0,
        "ram" => 12000000000,
        "vcpus" => 4
@@ -229,7 +230,7 @@ class ContainerTest < ActiveSupport::TestCase
      set_user_from_auth :active
      env = {"C" => "3", "B" => "2", "A" => "1"}
      m = {"F" => {"kind" => "3"}, "E" => {"kind" => "2"}, "D" => {"kind" => "1"}}
-    rc = {"vcpus" => 1, "ram" => 1, "keep_cache_ram" => 1, "API" => true, "cuda" => {"device_count":0, "driver_version": "", "hardware_capability": ""}}
+    rc = {"vcpus" => 1, "ram" => 1, "keep_cache_ram" => 1, "keep_cache_disk" => 0, "API" => true, "cuda" => {"device_count":0, "driver_version": "", "hardware_capability": ""}}
      c, _ = minimal_new(environment: env, mounts: m, runtime_constraints: rc)
      c.reload
      assert_equal Container.deep_sort_hash(env).to_json, c.environment.to_json
@@ -594,14 +595,14 @@ class ContainerTest < ActiveSupport::TestCase
      set_user_from_auth :active
      # No cuda
      no_cuda_attrs = REUSABLE_COMMON_ATTRS.merge({use_existing:false, priority:1, environment:{"var" => "queued"},
-                                                runtime_constraints: {"vcpus" => 1, "ram" => 1, "keep_cache_ram"=>268435456, "API" => false,
+                                                runtime_constraints: {"vcpus" => 1, "ram" => 1, "keep_cache_disk"=>0, "keep_cache_ram"=>268435456, "API" => false,
                                                                        "cuda" => {"device_count":0, "driver_version": "", "hardware_capability": ""}},})
      c1, _ = minimal_new(no_cuda_attrs)
      assert_equal Container::Queued, c1.state
  
      # has cuda
      cuda_attrs = REUSABLE_COMMON_ATTRS.merge({use_existing:false, priority:1, environment:{"var" => "queued"},
-                                                runtime_constraints: {"vcpus" => 1, "ram" => 1, "keep_cache_ram"=>268435456, "API" => false,
+                                                runtime_constraints: {"vcpus" => 1, "ram" => 1, "keep_cache_disk"=>0, "keep_cache_ram"=>268435456, "API" => false,
                                                                        "cuda" => {"device_count":1, "driver_version": "11.0", "hardware_capability": "9.0"}},})
      c2, _ = minimal_new(cuda_attrs)
      assert_equal Container::Queued, c2.state
diff --git a/services/crunch-dispatch-slurm/crunch-dispatch-slurm.go b/services/crunch-dispatch-slurm/crunch-dispatch-slurm.go

index ac394e114962ddf05d2e71e94cc4bb1ff46c4780..1c0f6ad28f5ba7b6d20bcc0cadbef0fb87fec634 100644 (file)
--- a/services/crunch-dispatch-slurm/crunch-dispatch-slurm.go
+++ b/services/crunch-dispatch-slurm/crunch-dispatch-slurm.go
@@ -19,6 +19,8 @@ import (
         "time"
  
         "git.arvados.org/arvados.git/lib/cmd"
+       "git.arvados.org/arvados.git/lib/controller/dblock"
+       "git.arvados.org/arvados.git/lib/ctrlctx"
         "git.arvados.org/arvados.git/lib/dispatchcloud"
         "git.arvados.org/arvados.git/lib/service"
         "git.arvados.org/arvados.git/sdk/go/arvados"
@@ -55,10 +57,11 @@ const initialNiceValue int64 = 10000
  
  type Dispatcher struct {
         *dispatch.Dispatcher
-       logger  logrus.FieldLogger
-       cluster *arvados.Cluster
-       sqCheck *SqueueChecker
-       slurm   Slurm
+       logger      logrus.FieldLogger
+       cluster     *arvados.Cluster
+       sqCheck     *SqueueChecker
+       slurm       Slurm
+       dbConnector ctrlctx.DBConnector
  
         done chan struct{}
         err  error
@@ -90,6 +93,7 @@ func (disp *Dispatcher) configure() error {
         disp.Client.APIHost = disp.cluster.Services.Controller.ExternalURL.Host
         disp.Client.AuthToken = disp.cluster.SystemRootToken
         disp.Client.Insecure = disp.cluster.TLS.Insecure
+       disp.dbConnector = ctrlctx.DBConnector{PostgreSQL: disp.cluster.PostgreSQL}
  
         if disp.Client.APIHost != "" || disp.Client.AuthToken != "" {
                 // Copy real configs into env vars so [a]
@@ -137,6 +141,8 @@ func (disp *Dispatcher) setup() {
  }
  
  func (disp *Dispatcher) run() error {
+       dblock.Dispatch.Lock(context.Background(), disp.dbConnector.GetDB)
+       defer dblock.Dispatch.Unlock()
         defer disp.sqCheck.Stop()
  
         if disp.cluster != nil && len(disp.cluster.InstanceTypes) > 0 {
diff --git a/services/crunchstat/crunchstat.go b/services/crunchstat/crunchstat.go

index 6383eae5452dd1d145420e7da41ce773878b5cef..d28bee0f5e19591275eab2ae43d2a640d316de6d 100644 (file)
--- a/services/crunchstat/crunchstat.go
+++ b/services/crunchstat/crunchstat.go
@@ -28,6 +28,10 @@ var (
         version               = "dev"
  )
  
+type logger interface { // the only logging method the helpers in this file call; *log.Logger is what main passes in
+       Printf(string, ...interface{})
+}
+
  func main() {
         reporter := crunchstat.Reporter{
                 Logger: log.New(os.Stderr, "crunchstat: ", 0),
@@ -55,9 +59,11 @@ func main() {
         reporter.Logger.Printf("crunchstat %s started", version)
  
         if reporter.CgroupRoot == "" {
-               reporter.Logger.Fatal("error: must provide -cgroup-root")
+               reporter.Logger.Printf("error: must provide -cgroup-root")
+               os.Exit(2)
         } else if signalOnDeadPPID < 0 {
-               reporter.Logger.Fatalf("-signal-on-dead-ppid=%d is invalid (use a positive signal number, or 0 to disable)", signalOnDeadPPID)
+               reporter.Logger.Printf("-signal-on-dead-ppid=%d is invalid (use a positive signal number, or 0 to disable)", signalOnDeadPPID)
+               os.Exit(2)
         }
         reporter.PollPeriod = time.Duration(*pollMsec) * time.Millisecond
  
@@ -76,17 +82,19 @@ func main() {
                 if status, ok := err.Sys().(syscall.WaitStatus); ok {
                         os.Exit(status.ExitStatus())
                 } else {
-                       reporter.Logger.Fatalln("ExitError without WaitStatus:", err)
+                       reporter.Logger.Printf("ExitError without WaitStatus: %v", err)
+                       os.Exit(1)
                 }
         } else if err != nil {
-               reporter.Logger.Fatalln("error in cmd.Wait:", err)
+               reporter.Logger.Printf("error running command: %v", err)
+               os.Exit(1)
         }
  }
  
-func runCommand(argv []string, logger *log.Logger) error {
+func runCommand(argv []string, logger logger) error {
         cmd := exec.Command(argv[0], argv[1:]...)
  
-       logger.Println("Running", argv)
+       logger.Printf("Running %v", argv)
  
         // Child process will use our stdin and stdout pipes
         // (we close our copies below)
@@ -100,7 +108,7 @@ func runCommand(argv []string, logger *log.Logger) error {
                 if cmd.Process != nil {
                         cmd.Process.Signal(catch)
                 }
-               logger.Println("notice: caught signal:", catch)
+               logger.Printf("notice: caught signal: %v", catch)
         }(sigChan)
         signal.Notify(sigChan, syscall.SIGTERM)
         signal.Notify(sigChan, syscall.SIGINT)
@@ -113,24 +121,30 @@ func runCommand(argv []string, logger *log.Logger) error {
         // Funnel stderr through our channel
         stderrPipe, err := cmd.StderrPipe()
         if err != nil {
-               logger.Fatalln("error in StderrPipe:", err)
+               logger.Printf("error in StderrPipe: %v", err)
+               return err
         }
  
         // Run subprocess
         if err := cmd.Start(); err != nil {
-               logger.Fatalln("error in cmd.Start:", err)
+               logger.Printf("error in cmd.Start: %v", err)
+               return err
         }
  
         // Close stdin/stdout in this (parent) process
         os.Stdin.Close()
         os.Stdout.Close()
  
-       copyPipeToChildLog(stderrPipe, log.New(os.Stderr, "", 0))
+       err = copyPipeToChildLog(stderrPipe, log.New(os.Stderr, "", 0))
+       if err != nil {
+               cmd.Process.Kill()
+               return err
+       }
  
         return cmd.Wait()
  }
  
-func sendSignalOnDeadPPID(intvl time.Duration, signum, ppidOrig int, cmd *exec.Cmd, logger *log.Logger) {
+func sendSignalOnDeadPPID(intvl time.Duration, signum, ppidOrig int, cmd *exec.Cmd, logger logger) {
         ticker := time.NewTicker(intvl)
         for range ticker.C {
                 ppid := os.Getppid()
@@ -152,7 +166,7 @@ func sendSignalOnDeadPPID(intvl time.Duration, signum, ppidOrig int, cmd *exec.C
         }
  }
  
-func copyPipeToChildLog(in io.ReadCloser, logger *log.Logger) {
+func copyPipeToChildLog(in io.ReadCloser, logger logger) error {
         reader := bufio.NewReaderSize(in, MaxLogLine)
         var prefix string
         for {
@@ -160,13 +174,13 @@ func copyPipeToChildLog(in io.ReadCloser, logger *log.Logger) {
                 if err == io.EOF {
                         break
                 } else if err != nil {
-                       logger.Fatal("error reading child stderr:", err)
+                       return fmt.Errorf("error reading child stderr: %w", err)
                 }
                 var suffix string
                 if isPrefix {
                         suffix = "[...]"
                 }
-               logger.Print(prefix, string(line), suffix)
+               logger.Printf("%s%s%s", prefix, string(line), suffix)
                 // Set up prefix for following line
                 if isPrefix {
                         prefix = "[...]"
@@ -174,5 +188,5 @@ func copyPipeToChildLog(in io.ReadCloser, logger *log.Logger) {
                         prefix = ""
                 }
         }
-       in.Close()
+       return in.Close()
  }
diff --git a/services/fuse/README.rst b/services/fuse/README.rst

index 0416d3dbd2cc6eaddcf780326bca845c2cb55710..e0d5046ae25e9cb7058e9bd85ba6673d2cbc8de8 100644 (file)
--- a/services/fuse/README.rst
+++ b/services/fuse/README.rst
@@ -66,5 +66,5 @@ $ apt-get install python-dev pkg-config libfuse-dev libattr1-dev
  This package is one part of the Arvados source package, and it has
  integration tests to check interoperability with other Arvados
  components.  Our `hacking guide
-<https://arvados.org/projects/arvados/wiki/Hacking_Python_SDK>`_
+<https://dev.arvados.org/projects/arvados/wiki/Hacking_Python_SDK>`_
  describes how to set up a development environment and run tests.
diff --git a/services/fuse/arvados_fuse/command.py b/services/fuse/arvados_fuse/command.py

index 5f0a1f80f6a4e9f693c91b8946ce41cac6c2f227..994c998823905e4f2398b15eb911768de6e03aa5 100644 (file)
--- a/services/fuse/arvados_fuse/command.py
+++ b/services/fuse/arvados_fuse/command.py
@@ -83,13 +83,20 @@ class ArgumentParser(argparse.ArgumentParser):
                              type=str, metavar='PATH', action='append', default=[],
                              help="Create a new collection, mount it in read/write mode at mountpoint/PATH, and delete it when unmounting.")
  
+
          self.add_argument('--debug', action='store_true', help="""Debug mode""")
          self.add_argument('--logfile', help="""Write debug logs and errors to the specified file (default stderr).""")
          self.add_argument('--foreground', action='store_true', help="""Run in foreground (default is to daemonize unless --exec specified)""", default=False)
          self.add_argument('--encoding', type=str, help="Character encoding to use for filesystem, default is utf-8 (see Python codec registry for list of available encodings)", default="utf-8")
  
-        self.add_argument('--file-cache', type=int, help="File data cache size, in bytes (default 256MiB)", default=256*1024*1024)
-        self.add_argument('--directory-cache', type=int, help="Directory data cache size, in bytes (default 128MiB)", default=128*1024*1024)
+        self.add_argument('--file-cache', type=int, help="File data cache size, in bytes (default 8 GiB for disk-based cache or 256 MiB with RAM-only cache)", default=0)
+        self.add_argument('--directory-cache', type=int, help="Directory data cache size, in bytes (default 128 MiB)", default=128*1024*1024)
+
+        cachetype = self.add_mutually_exclusive_group()
+        cachetype.add_argument('--ram-cache', action='store_false', dest='disk_cache', help="Use in-memory caching only", default=True)
+        cachetype.add_argument('--disk-cache', action='store_true', dest='disk_cache', help="Use disk based caching (default)", default=True)
+
+        self.add_argument('--disk-cache-dir', type=str, help="Disk cache location (default ~/.cache/arvados/keep)", default=None)
  
          self.add_argument('--disable-event-listening', action='store_true', help="Don't subscribe to events on the API server", dest="disable_event_listening", default=False)
  
@@ -213,8 +220,12 @@ class Mount(object):
          try:
              self.api = arvados.safeapi.ThreadSafeApiCache(
                  apiconfig=arvados.config.settings(),
+                # default value of file_cache is 0, this tells KeepBlockCache to
+                # choose a default based on whether disk_cache is enabled or not.
                  keep_params={
-                    'block_cache': arvados.keep.KeepBlockCache(self.args.file_cache),
+                    'block_cache': arvados.keep.KeepBlockCache(cache_max=self.args.file_cache,
+                                                               disk_cache=self.args.disk_cache,
+                                                               disk_cache_dir=self.args.disk_cache_dir),
                      'num_retries': self.args.retries,
                  })
          except KeyError as e:
diff --git a/services/fuse/setup.py b/services/fuse/setup.py

index 545b4bfa01c70135585491dcb2c946bd847a4871..d0c46f132040aa400645473ddf347c53be135d23 100644 (file)
--- a/services/fuse/setup.py
+++ b/services/fuse/setup.py
@@ -59,6 +59,6 @@ setup(name='arvados_fuse',
            'Programming Language :: Python :: 3',
        ],
        test_suite='tests',
-      tests_require=['pbr<1.7.0', 'mock>=1.0', 'PyYAML'],
+      tests_require=['pbr<1.7.0', 'mock>=1.0', 'PyYAML', 'parameterized',],
        zip_safe=False
        )
diff --git a/services/fuse/tests/mount_test_base.py b/services/fuse/tests/mount_test_base.py

index 7cf8aa373a9e3b215593d507da0bb216531cf8d4..e82660408bbeb784f07dda1db344991de882f9c4 100644 (file)
--- a/services/fuse/tests/mount_test_base.py
+++ b/services/fuse/tests/mount_test_base.py
@@ -4,6 +4,7 @@
  
  from __future__ import absolute_import
  import arvados
+import arvados.keep
  import arvados_fuse as fuse
  import arvados.safeapi
  import llfuse
@@ -24,7 +25,16 @@ logger = logging.getLogger('arvados.arv-mount')
  
  from .integration_test import workerPool
  
+def make_block_cache(disk_cache):
+    if disk_cache:
+        disk_cache_dir = os.path.join(os.path.expanduser("~"), ".cache", "arvados", "keep")
+        shutil.rmtree(disk_cache_dir, ignore_errors=True)
+    block_cache = arvados.keep.KeepBlockCache(disk_cache=disk_cache)
+    return block_cache
+
  class MountTestBase(unittest.TestCase):
+    disk_cache = False
+
      def setUp(self, api=None, local_store=True):
          # The underlying C implementation of open() makes a fstat() syscall
          # with the GIL still held.  When the GETATTR message comes back to
@@ -43,7 +53,8 @@ class MountTestBase(unittest.TestCase):
          self.mounttmp = tempfile.mkdtemp()
          run_test_server.run()
          run_test_server.authorize_with("admin")
-        self.api = api if api else arvados.safeapi.ThreadSafeApiCache(arvados.config.settings())
+
+        self.api = api if api else arvados.safeapi.ThreadSafeApiCache(arvados.config.settings(), keep_params={"block_cache": make_block_cache(self.disk_cache)})
          self.llfuse_thread = None
  
      # This is a copy of Mount's method.  TODO: Refactor MountTestBase
diff --git a/services/fuse/tests/test_mount.py b/services/fuse/tests/test_mount.py

index 1601db59440be8b57c35b988869a1a56229ef92b..df3d4263417bcc271b77c05dc75aec0ee8343aea 100644 (file)
--- a/services/fuse/tests/test_mount.py
+++ b/services/fuse/tests/test_mount.py
@@ -16,6 +16,7 @@ import subprocess
  import time
  import unittest
  import tempfile
+import parameterized
  
  import arvados
  import arvados_fuse as fuse
@@ -54,7 +55,7 @@ class AssertWithTimeout(object):
          else:
              self.done = True
  
-
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
  class FuseMountTest(MountTestBase):
      def setUp(self):
          super(FuseMountTest, self).setUp()
@@ -125,6 +126,7 @@ class FuseMountTest(MountTestBase):
                  self.assertEqual(v, f.read().decode())
  
  
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
  class FuseMagicTest(MountTestBase):
      def setUp(self, api=None):
          super(FuseMagicTest, self).setUp(api=api)
@@ -283,6 +285,7 @@ def fuseSharedTestHelper(mounttmp):
  
      Test().runTest()
  
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
  class FuseSharedTest(MountTestBase):
      def runTest(self):
          self.make_mount(fuse.SharedDirectory,
@@ -343,6 +346,7 @@ def fuseModifyFileTestHelperReadEndContents(mounttmp):
                  self.assertEqual("plnp", f.read())
      Test().runTest()
  
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
  class FuseModifyFileTest(MountTestBase):
      def runTest(self):
          collection = arvados.collection.Collection(api_client=self.api)
@@ -363,6 +367,7 @@ class FuseModifyFileTest(MountTestBase):
          self.pool.apply(fuseModifyFileTestHelperReadEndContents, (self.mounttmp,))
  
  
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
  class FuseAddFileToCollectionTest(MountTestBase):
      def runTest(self):
          collection = arvados.collection.Collection(api_client=self.api)
@@ -385,6 +390,7 @@ class FuseAddFileToCollectionTest(MountTestBase):
          self.assertEqual(["file1.txt", "file2.txt"], sorted(d1))
  
  
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
  class FuseRemoveFileFromCollectionTest(MountTestBase):
      def runTest(self):
          collection = arvados.collection.Collection(api_client=self.api)
@@ -416,6 +422,7 @@ def fuseCreateFileTestHelper(mounttmp):
                  pass
      Test().runTest()
  
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
  class FuseCreateFileTest(MountTestBase):
      def runTest(self):
          collection = arvados.collection.Collection(api_client=self.api)
@@ -459,6 +466,7 @@ def fuseWriteFileTestHelperReadFile(mounttmp):
                  self.assertEqual(f.read(), "Hello world!")
      Test().runTest()
  
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
  class FuseWriteFileTest(MountTestBase):
      def runTest(self):
          collection = arvados.collection.Collection(api_client=self.api)
@@ -507,6 +515,7 @@ def fuseUpdateFileTestHelper(mounttmp):
  
      Test().runTest()
  
+@parameterized.parameterized_class([{"disk_cache": True}, {"disk_cache": False}])
  class FuseUpdateFileTest(MountTestBase):
      def runTest(self):
          collection = arvados.collection.Collection(api_client=self.api)
diff --git a/services/keep-balance/balance.go b/services/keep-balance/balance.go

index 1dedb409a4a2de5c4f414959b024e291007d42b1..9f581751d938baf8d0f8fdc726bfae92e1f6877d 100644 (file)
--- a/services/keep-balance/balance.go
+++ b/services/keep-balance/balance.go
@@ -23,7 +23,9 @@ import (
         "syscall"
         "time"
  
+       "git.arvados.org/arvados.git/lib/controller/dblock"
         "git.arvados.org/arvados.git/sdk/go/arvados"
+       "git.arvados.org/arvados.git/sdk/go/ctxlog"
         "git.arvados.org/arvados.git/sdk/go/keepclient"
         "github.com/jmoiron/sqlx"
         "github.com/sirupsen/logrus"
@@ -67,16 +69,19 @@ type Balancer struct {
  // subsequent balance operation.
  //
  // Run should only be called once on a given Balancer object.
-//
-// Typical usage:
-//
-//   runOptions, err = (&Balancer{}).Run(config, runOptions)
-func (bal *Balancer) Run(client *arvados.Client, cluster *arvados.Cluster, runOptions RunOptions) (nextRunOptions RunOptions, err error) {
+func (bal *Balancer) Run(ctx context.Context, client *arvados.Client, cluster *arvados.Cluster, runOptions RunOptions) (nextRunOptions RunOptions, err error) {
         nextRunOptions = runOptions
  
+       ctxlog.FromContext(ctx).Info("acquiring active lock")
+       if !dblock.KeepBalanceActive.Lock(ctx, func(context.Context) (*sqlx.DB, error) { return bal.DB, nil }) {
+               // context canceled
+               return
+       }
+       defer dblock.KeepBalanceActive.Unlock()
+
         defer bal.time("sweep", "wall clock time to run one full sweep")()
  
-       ctx, cancel := context.WithDeadline(context.Background(), time.Now().Add(cluster.Collections.BalanceTimeout.Duration()))
+       ctx, cancel := context.WithDeadline(ctx, time.Now().Add(cluster.Collections.BalanceTimeout.Duration()))
         defer cancel()
  
         var lbFile *os.File
diff --git a/services/keep-balance/balance_run_test.go b/services/keep-balance/balance_run_test.go

index 2db7bea173c17dc41f6943b4fe579cbc7d15a24f..4772da55a2d6dddc79acff891dee1034781f7582 100644 (file)
--- a/services/keep-balance/balance_run_test.go
+++ b/services/keep-balance/balance_run_test.go
@@ -6,6 +6,7 @@ package keepbalance
  
  import (
         "bytes"
+       "context"
         "encoding/json"
         "fmt"
         "io"
@@ -372,7 +373,7 @@ func (s *runSuite) TestRefuseZeroCollections(c *check.C) {
         trashReqs := s.stub.serveKeepstoreTrash()
         pullReqs := s.stub.serveKeepstorePull()
         srv := s.newServer(&opts)
-       _, err = srv.runOnce()
+       _, err = srv.runOnce(context.Background())
         c.Check(err, check.ErrorMatches, "received zero collections")
         c.Check(trashReqs.Count(), check.Equals, 4)
         c.Check(pullReqs.Count(), check.Equals, 0)
@@ -391,7 +392,7 @@ func (s *runSuite) TestRefuseNonAdmin(c *check.C) {
         trashReqs := s.stub.serveKeepstoreTrash()
         pullReqs := s.stub.serveKeepstorePull()
         srv := s.newServer(&opts)
-       _, err := srv.runOnce()
+       _, err := srv.runOnce(context.Background())
         c.Check(err, check.ErrorMatches, "current user .* is not .* admin user")
         c.Check(trashReqs.Count(), check.Equals, 0)
         c.Check(pullReqs.Count(), check.Equals, 0)
@@ -417,7 +418,7 @@ func (s *runSuite) TestRefuseSameDeviceDifferentVolumes(c *check.C) {
         trashReqs := s.stub.serveKeepstoreTrash()
         pullReqs := s.stub.serveKeepstorePull()
         srv := s.newServer(&opts)
-       _, err := srv.runOnce()
+       _, err := srv.runOnce(context.Background())
         c.Check(err, check.ErrorMatches, "cannot continue with config errors.*")
         c.Check(trashReqs.Count(), check.Equals, 0)
         c.Check(pullReqs.Count(), check.Equals, 0)
@@ -442,7 +443,7 @@ func (s *runSuite) TestWriteLostBlocks(c *check.C) {
         s.stub.serveKeepstorePull()
         srv := s.newServer(&opts)
         c.Assert(err, check.IsNil)
-       _, err = srv.runOnce()
+       _, err = srv.runOnce(context.Background())
         c.Check(err, check.IsNil)
         lost, err := ioutil.ReadFile(lostf.Name())
         c.Assert(err, check.IsNil)
@@ -463,7 +464,7 @@ func (s *runSuite) TestDryRun(c *check.C) {
         trashReqs := s.stub.serveKeepstoreTrash()
         pullReqs := s.stub.serveKeepstorePull()
         srv := s.newServer(&opts)
-       bal, err := srv.runOnce()
+       bal, err := srv.runOnce(context.Background())
         c.Check(err, check.IsNil)
         for _, req := range collReqs.reqs {
                 c.Check(req.Form.Get("include_trash"), check.Equals, "true")
@@ -493,7 +494,7 @@ func (s *runSuite) TestCommit(c *check.C) {
         trashReqs := s.stub.serveKeepstoreTrash()
         pullReqs := s.stub.serveKeepstorePull()
         srv := s.newServer(&opts)
-       bal, err := srv.runOnce()
+       bal, err := srv.runOnce(context.Background())
         c.Check(err, check.IsNil)
         c.Check(trashReqs.Count(), check.Equals, 8)
         c.Check(pullReqs.Count(), check.Equals, 4)
@@ -533,13 +534,14 @@ func (s *runSuite) TestRunForever(c *check.C) {
         trashReqs := s.stub.serveKeepstoreTrash()
         pullReqs := s.stub.serveKeepstorePull()
  
-       stop := make(chan interface{})
+       ctx, cancel := context.WithCancel(context.Background())
+       defer cancel()
         s.config.Collections.BalancePeriod = arvados.Duration(time.Millisecond)
         srv := s.newServer(&opts)
  
         done := make(chan bool)
         go func() {
-               srv.runForever(stop)
+               srv.runForever(ctx)
                 close(done)
         }()
  
@@ -550,7 +552,7 @@ func (s *runSuite) TestRunForever(c *check.C) {
         for t0 := time.Now(); pullReqs.Count() < 16 && time.Since(t0) < 10*time.Second; {
                 time.Sleep(time.Millisecond)
         }
-       stop <- true
+       cancel()
         <-done
         c.Check(pullReqs.Count() >= 16, check.Equals, true)
         c.Check(trashReqs.Count(), check.Equals, pullReqs.Count()+4)
diff --git a/services/keep-balance/integration_test.go b/services/keep-balance/integration_test.go

index 3cfb5cdeda5039fb37f414f5cd0b095eea0e772d..42463a002a5ec73652f7f7ef6f00f8a8c4fb44a1 100644 (file)
--- a/services/keep-balance/integration_test.go
+++ b/services/keep-balance/integration_test.go
@@ -6,6 +6,7 @@ package keepbalance
  
  import (
         "bytes"
+       "context"
         "io"
         "os"
         "strings"
@@ -97,7 +98,7 @@ func (s *integrationSuite) TestBalanceAPIFixtures(c *check.C) {
                         Logger:  logger,
                         Metrics: newMetrics(prometheus.NewRegistry()),
                 }
-               nextOpts, err := bal.Run(s.client, s.config, opts)
+               nextOpts, err := bal.Run(context.Background(), s.client, s.config, opts)
                 c.Check(err, check.IsNil)
                 c.Check(nextOpts.SafeRendezvousState, check.Not(check.Equals), "")
                 c.Check(nextOpts.CommitPulls, check.Equals, true)
diff --git a/services/keep-balance/main.go b/services/keep-balance/main.go

index f0b0df5bd331d6a97a2cdaab0a8d968cfdbfc550..b016db22ffe67f6316f1e4f537bfa680f135ecad 100644 (file)
--- a/services/keep-balance/main.go
+++ b/services/keep-balance/main.go
@@ -112,7 +112,7 @@ func (command) RunCommand(prog string, args []string, stdin io.Reader, stdout, s
                                 Routes: health.Routes{"ping": srv.CheckHealth},
                         }
  
-                       go srv.run()
+                       go srv.run(ctx)
                         return srv
                 }).RunCommand(prog, args, stdin, stdout, stderr)
  }
diff --git a/services/keep-balance/server.go b/services/keep-balance/server.go

index e485f5b2061f28134306d1d897b22cb62e4190e9..fd53497f789ed4f5f1db458f99e69f8e7f10c1a7 100644 (file)
--- a/services/keep-balance/server.go
+++ b/services/keep-balance/server.go
@@ -5,12 +5,14 @@
  package keepbalance
  
  import (
+       "context"
         "net/http"
         "os"
         "os/signal"
         "syscall"
         "time"
  
+       "git.arvados.org/arvados.git/lib/controller/dblock"
         "git.arvados.org/arvados.git/sdk/go/arvados"
         "github.com/jmoiron/sqlx"
         "github.com/sirupsen/logrus"
@@ -62,12 +64,12 @@ func (srv *Server) Done() <-chan struct{} {
         return nil
  }
  
-func (srv *Server) run() {
+func (srv *Server) run(ctx context.Context) {
         var err error
         if srv.RunOptions.Once {
-               _, err = srv.runOnce()
+               _, err = srv.runOnce(ctx)
         } else {
-               err = srv.runForever(nil)
+               err = srv.runForever(ctx)
         }
         if err != nil {
                 srv.Logger.Error(err)
@@ -77,7 +79,7 @@ func (srv *Server) run() {
         }
  }
  
-func (srv *Server) runOnce() (*Balancer, error) {
+func (srv *Server) runOnce(ctx context.Context) (*Balancer, error) {
         bal := &Balancer{
                 DB:             srv.DB,
                 Logger:         srv.Logger,
@@ -86,13 +88,12 @@ func (srv *Server) runOnce() (*Balancer, error) {
                 LostBlocksFile: srv.Cluster.Collections.BlobMissingReport,
         }
         var err error
-       srv.RunOptions, err = bal.Run(srv.ArvClient, srv.Cluster, srv.RunOptions)
+       srv.RunOptions, err = bal.Run(ctx, srv.ArvClient, srv.Cluster, srv.RunOptions)
         return bal, err
  }
  
-// RunForever runs forever, or (for testing purposes) until the given
-// stop channel is ready to receive.
-func (srv *Server) runForever(stop <-chan interface{}) error {
+// runForever runs forever, or until ctx is canceled.
+func (srv *Server) runForever(ctx context.Context) error {
         logger := srv.Logger
  
         ticker := time.NewTicker(time.Duration(srv.Cluster.Collections.BalancePeriod))
@@ -102,6 +103,10 @@ func (srv *Server) runForever(stop <-chan interface{}) error {
         sigUSR1 := make(chan os.Signal)
         signal.Notify(sigUSR1, syscall.SIGUSR1)
  
+       logger.Info("acquiring service lock")
+       dblock.KeepBalanceService.Lock(ctx, func(context.Context) (*sqlx.DB, error) { return srv.DB, nil })
+       defer dblock.KeepBalanceService.Unlock()
+
         logger.Printf("starting up: will scan every %v and on SIGUSR1", srv.Cluster.Collections.BalancePeriod)
  
         for {
@@ -110,7 +115,11 @@ func (srv *Server) runForever(stop <-chan interface{}) error {
                         logger.Print("=======  Consider using -commit-pulls and -commit-trash flags.")
                 }
  
-               _, err := srv.runOnce()
+               if !dblock.KeepBalanceService.Check() {
+                       // context canceled
+                       return nil
+               }
+               _, err := srv.runOnce(ctx)
                 if err != nil {
                         logger.Print("run failed: ", err)
                 } else {
@@ -118,7 +127,7 @@ func (srv *Server) runForever(stop <-chan interface{}) error {
                 }
  
                 select {
-               case <-stop:
+               case <-ctx.Done():
                         signal.Stop(sigUSR1)
                         return nil
                 case <-ticker.C:
diff --git a/services/keepstore/s3_volume.go b/services/keepstore/s3_volume.go

index ee89b156f796b49395fc6ec151de6ab12127e176..78737640045db53691f03f27742ffc4f495debd0 100644 (file)
--- a/services/keepstore/s3_volume.go
+++ b/services/keepstore/s3_volume.go
@@ -56,15 +56,12 @@ func (v *S3Volume) check() error {
                 return errors.New("DriverParameters: RaceWindow must not be negative")
         }
  
-       var ok bool
-       v.region, ok = aws.Regions[v.Region]
         if v.Endpoint == "" {
+               r, ok := aws.Regions[v.Region]
                 if !ok {
                         return fmt.Errorf("unrecognized region %+q; try specifying endpoint instead", v.Region)
                 }
-       } else if ok {
-               return fmt.Errorf("refusing to use AWS region name %+q with endpoint %+q; "+
-                       "specify empty endpoint or use a different region name", v.Region, v.Endpoint)
+               v.region = r
         } else {
                 v.region = aws.Region{
                         Name:                 v.Region,
diff --git a/services/keepstore/s3aws_volume.go b/services/keepstore/s3aws_volume.go

index 6205da5beb258dd8a9a354256715744c821794a6..d068dde074ea254ef814aea38eefa6f63102d7e3 100644 (file)
--- a/services/keepstore/s3aws_volume.go
+++ b/services/keepstore/s3aws_volume.go
@@ -62,6 +62,8 @@ type s3AWSbucket struct {
  // aws-sdk-go based on the UseAWSS3v2Driver feature flag
  func chooseS3VolumeDriver(cluster *arvados.Cluster, volume arvados.Volume, logger logrus.FieldLogger, metrics *volumeMetricsVecs) (Volume, error) {
         v := &S3Volume{cluster: cluster, volume: volume, metrics: metrics}
+       // Default value will be overridden if it happens to be defined in the config
+       v.S3VolumeDriverParameters.UseAWSS3v2Driver = true
         err := json.Unmarshal(volume.DriverParameters, v)
         if err != nil {
                 return nil, err
@@ -182,19 +184,25 @@ func (v *S3AWSVolume) check(ec2metadataHostname string) error {
                         if v.Endpoint != "" && service == "s3" {
                                 return aws.Endpoint{
                                         URL:           v.Endpoint,
-                                       SigningRegion: v.Region,
+                                       SigningRegion: region,
                                 }, nil
                         } else if service == "ec2metadata" && ec2metadataHostname != "" {
                                 return aws.Endpoint{
                                         URL: ec2metadataHostname,
                                 }, nil
+                       } else {
+                               return defaultResolver.ResolveEndpoint(service, region)
                         }
-
-                       return defaultResolver.ResolveEndpoint(service, region)
                 }
                 cfg.EndpointResolver = aws.EndpointResolverFunc(myCustomResolver)
         }
-
+       if v.Region == "" {
+               // Endpoint is already specified (otherwise we would
+               // have errored out above), but Region is also
+               // required by the aws sdk, in order to determine
+               // SignatureVersions.
+               v.Region = "us-east-1"
+       }
         cfg.Region = v.Region
  
         // Zero timeouts mean "wait forever", which is a bad
diff --git a/services/login-sync/arvados-login-sync.gemspec b/services/login-sync/arvados-login-sync.gemspec

index f7fe4bc1645e5fc19eb6a7a3fb72edc122dcdd06..1f8252924b1ad30d46779a6384f2c8f71ce1e187 100644 (file)
--- a/services/login-sync/arvados-login-sync.gemspec
+++ b/services/login-sync/arvados-login-sync.gemspec
@@ -37,7 +37,11 @@ Gem::Specification.new do |s|
    s.files       = ["bin/arvados-login-sync", "agpl-3.0.txt"]
    s.executables << "arvados-login-sync"
    s.required_ruby_version = '>= 2.1.0'
-  s.add_runtime_dependency 'arvados', '>= 1.3.3.20190320201707'
+  # Note the letter 'a' at the end of the version dependency. This enables
+  # bundler's dependency resolver to include 'pre-release' versions, like the
+  # ones we build (but not publish) on every test pipeline job.
+  # See: https://github.com/rubygems/bundler/issues/4340
+  s.add_runtime_dependency 'arvados', '~> 2.4', '> 2.4.4a'
    s.add_runtime_dependency 'launchy', '< 2.5'
    # We need at least version 0.8.7.3, cf. https://dev.arvados.org/issues/15673
    s.add_dependency('arvados-google-api-client', '>= 0.8.7.3', '< 0.8.9')
diff --git a/services/login-sync/bin/arvados-login-sync b/services/login-sync/bin/arvados-login-sync

index 5c6691ab95279920498875a7e49295c8a2b4a5a4..915541baf5009df2a7d290b0f47654e3d1c256ae 100755 (executable)
--- a/services/login-sync/bin/arvados-login-sync
+++ b/services/login-sync/bin/arvados-login-sync
@@ -42,9 +42,14 @@ begin
      debug = true
    end
    arv = Arvados.new({ :suppress_ssl_warnings => false })
-  logincluster_arv = Arvados.new({ :api_host => (ENV['LOGINCLUSTER_ARVADOS_API_HOST'] || ENV['ARVADOS_API_HOST']),
-                                   :api_token => (ENV['LOGINCLUSTER_ARVADOS_API_TOKEN'] || ENV['ARVADOS_API_TOKEN']),
-                      :suppress_ssl_warnings => false })
+  logincluster_host = ENV['ARVADOS_API_HOST']
+  logincluster_name = arv.cluster_config['Login']['LoginCluster'] or ''
+
+  if logincluster_name != '' and logincluster_name != arv.cluster_config['ClusterID']
+    logincluster_host = arv.cluster_config['RemoteClusters'][logincluster_name]['Host']
+  end
+  logincluster_arv = Arvados.new({ :api_host => logincluster_host,
+                                   :suppress_ssl_warnings => false })
  
    vm_uuid = ENV['ARVADOS_VIRTUAL_MACHINE_UUID']
  
@@ -219,9 +224,9 @@ begin
          userEnv = IO::read(tokenfile)
          if (m = /^ARVADOS_API_TOKEN=(.*?\n)/m.match(userEnv))
            begin
-            tmp_arv = Arvados.new({ :api_host => (ENV['LOGINCLUSTER_ARVADOS_API_HOST'] || ENV['ARVADOS_API_HOST']),
-                                   :api_token => (m[1]),
-                      :suppress_ssl_warnings => false })
+            tmp_arv = Arvados.new({ :api_host => logincluster_host,
+                                    :api_token => (m[1]),
+                                    :suppress_ssl_warnings => false })
              tmp_arv.user.current
            rescue Arvados::TransactionFailedError => e
              if e.to_s =~ /401 Unauthorized/
diff --git a/tools/arvbox/bin/arvbox b/tools/arvbox/bin/arvbox

index e7416947d65d2abd5023f77f1b4de997b71c910d..b3b9a5fcb441900535954012ebc0ee05f77bf10f 100755 (executable)
--- a/tools/arvbox/bin/arvbox
+++ b/tools/arvbox/bin/arvbox
@@ -44,10 +44,6 @@ if test -z "$ARVADOS_ROOT" ; then
      ARVADOS_ROOT="$ARVBOX_DATA/arvados"
  fi
  
-if test -z "$COMPOSER_ROOT" ; then
-    COMPOSER_ROOT="$ARVBOX_DATA/composer"
-fi
-
  if test -z "$WORKBENCH2_ROOT" ; then
      WORKBENCH2_ROOT="$ARVBOX_DATA/workbench2"
  fi
@@ -138,7 +134,6 @@ wait_for_arvbox() {
  docker_run_dev() {
      docker run \
             "--volume=$ARVADOS_ROOT:/usr/src/arvados:rw" \
-           "--volume=$COMPOSER_ROOT:/usr/src/composer:rw" \
             "--volume=$WORKBENCH2_ROOT:/usr/src/workbench2:rw" \
             "--volume=$PG_DATA:/var/lib/postgresql:rw" \
             "--volume=$VAR_DATA:$ARVADOS_CONTAINER_PATH:rw" \
@@ -257,10 +252,6 @@ run() {
              git clone https://git.arvados.org/arvados.git "$ARVADOS_ROOT"
             git -C "$ARVADOS_ROOT" checkout $ARVADOS_BRANCH
          fi
-        if ! test -d "$COMPOSER_ROOT" ; then
-            git clone https://github.com/arvados/composer.git "$COMPOSER_ROOT"
-            git -C "$COMPOSER_ROOT" checkout arvados-fork
-        fi
          if ! test -d "$WORKBENCH2_ROOT" ; then
              git clone https://git.arvados.org/arvados-workbench2.git "$WORKBENCH2_ROOT"
             git -C "$ARVADOS_ROOT" checkout $WORKBENCH2_BRANCH
@@ -613,7 +604,6 @@ case "$subcmd" in
                 "$ARVBOX_BASE/$1/gopath" \
                 "$ARVBOX_BASE/$1/Rlibs" \
                 "$ARVBOX_BASE/$1/arvados" \
-               "$ARVBOX_BASE/$1/composer" \
                 "$ARVBOX_BASE/$1/workbench2" \
                 "$ARVBOX_BASE/$2"
              echo "Created new arvbox $2"
diff --git a/tools/arvbox/lib/arvbox/docker/common.sh b/tools/arvbox/lib/arvbox/docker/common.sh

index 4e95bdedfc465ac0c3c25065e2dd778f0b949775..d900f0377207a7a0717ec49c84643e8a9367aff9 100644 (file)
--- a/tools/arvbox/lib/arvbox/docker/common.sh
+++ b/tools/arvbox/lib/arvbox/docker/common.sh
@@ -15,6 +15,10 @@ export ARVADOS_CONTAINER_PATH=/var/lib/arvados-arvbox
  export GEM_HOME=$HOME/.gem
  GEMLOCK=$HOME/gems.lock
  
+export LANG=en_US.UTF-8
+export LANGUAGE=en_US:en
+export LC_ALL=en_US.UTF-8
+
  defaultdev=$(/sbin/ip route|awk '/default/ { print $5 }')
  dockerip=$(/sbin/ip route | grep default | awk '{ print $3 }')
  containerip=$(ip addr show $defaultdev | grep 'inet ' | sed 's/ *inet \(.*\)\/.*/\1/')
@@ -74,6 +78,11 @@ run_bundler() {
         # If present, use the one associated with rails workbench or API
         BUNDLER=$PWD/bin/bundle
      fi
+
+    if test -z "$(flock $GEMLOCK /var/lib/arvados/bin/gem list | grep 'arvados[[:blank:]].*[0-9.]*dev')" ; then
+        (cd /usr/src/arvados/sdk/ruby && \
+        /var/lib/arvados/bin/gem build arvados.gemspec && flock $GEMLOCK /var/lib/arvados/bin/gem install $(ls -1 *.gem | sort -r | head -n1))
+    fi
      if ! flock $GEMLOCK $BUNDLER install --verbose --local --no-deployment $frozen "$@" ; then
          flock $GEMLOCK $BUNDLER install --verbose --no-deployment $frozen "$@"
      fi
diff --git a/tools/arvbox/lib/arvbox/docker/service/ready/run-service b/tools/arvbox/lib/arvbox/docker/service/ready/run-service

index 5007fe0be3e8e459fdd107246b5987b324051bfd..1e9aae0c45eb6a4685324c6edcc99504f6bf3dff 100755 (executable)
--- a/tools/arvbox/lib/arvbox/docker/service/ready/run-service
+++ b/tools/arvbox/lib/arvbox/docker/service/ready/run-service
@@ -89,7 +89,8 @@ fi
  
  echo
  echo "Your Arvados-in-a-box is ready!"
-echo "Workbench is running at https://$localip"
-echo "Workbench2 is running at https://$localip:${services[workbench2-ssl]}"
+echo "Workbench is hosted at https://$localip"
+echo "Workbench2 is hosted at https://$localip:${services[workbench2-ssl]}"
+echo "Documentation is hosted at http://$localip:${services[doc]}"
  
  rm -r /tmp/arvbox-ready
diff --git a/tools/arvbox/lib/arvbox/docker/service/sdk/run-service b/tools/arvbox/lib/arvbox/docker/service/sdk/run-service

index 62eb50c7a17387e8ed1bef6ab4fbc334a96a82c9..d3ff7e868345b383fb7c98e27a88a36ad44db1ed 100755 (executable)
--- a/tools/arvbox/lib/arvbox/docker/service/sdk/run-service
+++ b/tools/arvbox/lib/arvbox/docker/service/sdk/run-service
@@ -14,6 +14,9 @@ cat > ~/.pip/pip.conf <<EOF
  download_cache = /var/lib/pip
  EOF
  
+cd /usr/src/arvados/sdk/ruby
+run_bundler --binstubs=binstubs
+
  cd /usr/src/arvados/sdk/cli
  run_bundler --binstubs=binstubs
  
diff --git a/tools/salt-install/config_examples/multi_host/aws/pillars/nginx_controller_configuration.sls b/tools/salt-install/config_examples/multi_host/aws/pillars/nginx_controller_configuration.sls

index 869cc596a3e3cafdf3698eee8847dad78d9ebd5e..5df1870c808846c219b6fa845fc32af939908a09 100644 (file)
--- a/tools/salt-install/config_examples/multi_host/aws/pillars/nginx_controller_configuration.sls
+++ b/tools/salt-install/config_examples/multi_host/aws/pillars/nginx_controller_configuration.sls
@@ -55,6 +55,8 @@ nginx:
                - proxy_set_header: 'X-Real-IP $remote_addr'
                - proxy_set_header: 'X-Forwarded-For $proxy_add_x_forwarded_for'
                - proxy_set_header: 'X-External-Client $external_client'
+              - proxy_set_header: 'Upgrade $http_upgrade'
+              - proxy_set_header: 'Connection "upgrade"'
                - proxy_max_temp_file_size: 0
                - proxy_request_buffering: 'off'
                - proxy_buffering: 'off'
diff --git a/tools/salt-install/config_examples/single_host/multiple_hostnames/pillars/nginx_controller_configuration.sls b/tools/salt-install/config_examples/single_host/multiple_hostnames/pillars/nginx_controller_configuration.sls

index bc28fd82595c3d39a8b657d674812b12013ff317..2b01237889a10186fdc9028d7ff8e8bd2765978f 100644 (file)
--- a/tools/salt-install/config_examples/single_host/multiple_hostnames/pillars/nginx_controller_configuration.sls
+++ b/tools/salt-install/config_examples/single_host/multiple_hostnames/pillars/nginx_controller_configuration.sls
@@ -54,6 +54,8 @@ nginx:
                - proxy_set_header: 'X-Real-IP $remote_addr'
                - proxy_set_header: 'X-Forwarded-For $proxy_add_x_forwarded_for'
                - proxy_set_header: 'X-External-Client $external_client'
+              - proxy_set_header: 'Upgrade $http_upgrade'
+              - proxy_set_header: 'Connection "upgrade"'
                - proxy_max_temp_file_size: 0
                - proxy_request_buffering: 'off'
                - proxy_buffering: 'off'
diff --git a/tools/salt-install/config_examples/single_host/single_hostname/pillars/nginx_controller_configuration.sls b/tools/salt-install/config_examples/single_host/single_hostname/pillars/nginx_controller_configuration.sls

index 3058367bc006992342559321696fb7b96664150c..55d54cf1cba84dab338b1eb5141352ae6f745714 100644 (file)
--- a/tools/salt-install/config_examples/single_host/single_hostname/pillars/nginx_controller_configuration.sls
+++ b/tools/salt-install/config_examples/single_host/single_hostname/pillars/nginx_controller_configuration.sls
@@ -54,6 +54,8 @@ nginx:
                - proxy_set_header: 'X-Real-IP $remote_addr'
                - proxy_set_header: 'X-Forwarded-For $proxy_add_x_forwarded_for'
                - proxy_set_header: 'X-External-Client $external_client'
+              - proxy_set_header: 'Upgrade $http_upgrade'
+              - proxy_set_header: 'Connection "upgrade"'
                - proxy_max_temp_file_size: 0
                - proxy_request_buffering: 'off'
                - proxy_buffering: 'off'
diff --git a/tools/user-activity/arvados_user_activity/main.py b/tools/user-activity/arvados_user_activity/main.py

index 3109e9f6662654f8bc70deb4f686eda43e66ea1f..ded96c3121c0cc8d020b401c4e8b39da791bbdac 100755 (executable)
--- a/tools/user-activity/arvados_user_activity/main.py
+++ b/tools/user-activity/arvados_user_activity/main.py
@@ -95,20 +95,20 @@ def getuserinfocsv(arv, uuid):
  collectionNameCache = {}
  def getCollectionName(arv, uuid, pdh):
      lookupField = uuid
-    filters = [["uuid","=",uuid]]
+    filters = [["uuid", "=", uuid]]
      cached = uuid in collectionNameCache
      # look up by uuid if it is available, fall back to look up by pdh
-    if len(uuid) != 27:
+    if uuid is None or len(uuid) != 27:
          # Look up by pdh. Note that this can be misleading; the download could
          # have happened from a collection with the same pdh but different name.
          # We arbitrarily pick the oldest collection with the pdh to lookup the
          # name, if the uuid for the request is not known.
          lookupField = pdh
-        filters = [["portable_data_hash","=",pdh]]
+        filters = [["portable_data_hash", "=", pdh]]
          cached = pdh in collectionNameCache
  
      if not cached:
-        u = arv.collections().list(filters=filters,order="created_at",limit=1).execute().get("items")
+        u = arv.collections().list(filters=filters, order="created_at", limit=1).execute().get("items")
          if len(u) < 1:
              return "(deleted)"
          collectionNameCache[lookupField] = u[0]["name"]
@@ -208,20 +208,19 @@ def main(arguments=None):
                  users[owner].append([loguuid, event_at, "Deleted collection %s" % (getname(e["properties"]["old_attributes"]))])
  
          elif e["event_type"] == "file_download":
-                users.setdefault(e["object_uuid"], [])
-                users[e["object_uuid"]].append([loguuid, event_at, "Downloaded file \"%s\" from \"%s\" (%s) (%s)" % (
-                                                                                       e["properties"].get("collection_file_path") or e["properties"].get("reqPath"),
-                                                                                       getCollectionName(arv, e["properties"].get("collection_uuid"), e["properties"].get("portable_data_hash")),
-                                                                                       e["properties"].get("collection_uuid"),
-                                                                                       e["properties"].get("portable_data_hash"))])
-
+            users.setdefault(e["object_uuid"], [])
+            users[e["object_uuid"]].append([loguuid, event_at, "Downloaded file \"%s\" from \"%s\" (%s) (%s)" % (
+                e["properties"].get("collection_file_path") or e["properties"].get("reqPath"),
+                getCollectionName(arv, e["properties"].get("collection_uuid"), e["properties"].get("portable_data_hash")),
+                e["properties"].get("collection_uuid"),
+                e["properties"].get("portable_data_hash"))])
  
          elif e["event_type"] == "file_upload":
-                users.setdefault(e["object_uuid"], [])
-                users[e["object_uuid"]].append([loguuid, event_at, "Uploaded file \"%s\" to \"%s\" (%s)" % (
-                                                                                    e["properties"].get("collection_file_path") or e["properties"].get("reqPath"),
-                                                                                    getCollectionName(arv, e["properties"].get("collection_uuid"), e["properties"].get("portable_data_hash")),
-                                                                                    e["properties"].get("collection_uuid"))])
+            users.setdefault(e["object_uuid"], [])
+            users[e["object_uuid"]].append([loguuid, event_at, "Uploaded file \"%s\" to \"%s\" (%s)" % (
+                e["properties"].get("collection_file_path") or e["properties"].get("reqPath"),
+                getCollectionName(arv, e["properties"].get("collection_uuid"), e["properties"].get("portable_data_hash")),
+                e["properties"].get("collection_uuid"))])
  
          else:
              users[owner].append([loguuid, event_at, "%s %s %s" % (e["event_type"], e["object_kind"], e["object_uuid"])])
author	Peter Amstutz <peter.amstutz@curii.com>
	Mon, 5 Dec 2022 18:43:01 +0000 (13:43 -0500)
committer	Peter Amstutz <peter.amstutz@curii.com>
	Mon, 5 Dec 2022 18:43:01 +0000 (13:43 -0500)
.gitignore		patch \| blob \| history
apps/workbench/Gemfile.lock		patch \| blob \| history
apps/workbench/app/helpers/version_helper.rb		patch \| blob \| history
apps/workbench/app/views/users/_tables.html.erb		patch \| blob \| history
apps/workbench/test/integration/report_issue_test.rb		patch \| blob \| history
build/package-build-dockerfiles/centos7/Dockerfile		patch \| blob \| history
build/run-build-packages-one-target.sh		patch \| blob \| history
build/run-build-packages.sh		patch \| blob \| history
build/run-library.sh		patch \| blob \| history
build/run-tests.sh		patch \| blob \| history
doc/_config.yml		patch \| blob \| history
doc/admin/diagnostics.html.textile.liquid	[new file with mode: 0644]	patch \| blob
doc/admin/federation.html.textile.liquid		patch \| blob \| history
doc/admin/group-management.html.textile.liquid		patch \| blob \| history
doc/admin/health-checks.html.textile.liquid		patch \| blob \| history
doc/admin/maintenance-and-upgrading.html.textile.liquid		patch \| blob \| history
doc/admin/upgrading.html.textile.liquid		patch \| blob \| history
doc/api/methods/groups.html.textile.liquid		patch \| blob \| history
doc/api/projects.html.textile.liquid		patch \| blob \| history
doc/api/properties.html.textile.liquid	[new file with mode: 0644]	patch \| blob
doc/architecture/federation.html.textile.liquid		patch \| blob \| history
doc/install/configure-s3-object-storage.html.textile.liquid		patch \| blob \| history
doc/install/crunch2-cloud/install-dispatch-cloud.html.textile.liquid		patch \| blob \| history
doc/install/crunch2-lsf/install-dispatch.html.textile.liquid		patch \| blob \| history
doc/install/crunch2-slurm/install-test.html.textile.liquid		patch \| blob \| history
doc/install/install-shell-server.html.textile.liquid		patch \| blob \| history
doc/sdk/index.html.textile.liquid		patch \| blob \| history
doc/sdk/perl/example.html.textile.liquid	[deleted file]	patch \| blob \| history
doc/sdk/perl/index.html.textile.liquid	[deleted file]	patch \| blob \| history
doc/sdk/python/cookbook.html.textile.liquid		patch \| blob \| history
doc/user/cwl/cwl-run-options.html.textile.liquid		patch \| blob \| history
doc/user/cwl/cwl-style.html.textile.liquid		patch \| blob \| history
lib/config/config.default.yml		patch \| blob \| history
lib/config/export.go		patch \| blob \| history
lib/controller/dblock/dblock.go		patch \| blob \| history
lib/controller/dblock/dblock_test.go	[new file with mode: 0644]	patch \| blob
lib/controller/federation.go		patch \| blob \| history
lib/controller/federation/conn.go		patch \| blob \| history
lib/controller/federation/generate.go		patch \| blob \| history
lib/controller/federation/generated.go		patch \| blob \| history
lib/controller/federation/list.go		patch \| blob \| history
lib/controller/federation/login_test.go		patch \| blob \| history
lib/controller/handler.go		patch \| blob \| history
lib/controller/handler_test.go		patch \| blob \| history
lib/controller/localdb/collection.go		patch \| blob \| history
lib/controller/localdb/conn.go		patch \| blob \| history
lib/controller/localdb/container_request.go		patch \| blob \| history
lib/controller/localdb/group.go		patch \| blob \| history
lib/controller/localdb/log_activity.go	[new file with mode: 0644]	patch \| blob
lib/controller/localdb/log_activity_test.go	[new file with mode: 0644]	patch \| blob
lib/controller/localdb/login.go		patch \| blob \| history
lib/controller/localdb/login_oidc.go		patch \| blob \| history
lib/controller/localdb/login_oidc_test.go		patch \| blob \| history
lib/controller/localdb/login_testuser_test.go		patch \| blob \| history
lib/controller/localdb/logout.go		patch \| blob \| history
lib/controller/router/router.go		patch \| blob \| history
lib/controller/rpc/conn.go		patch \| blob \| history
lib/controller/trash.go		patch \| blob \| history
lib/crunchrun/crunchrun.go		patch \| blob \| history
lib/crunchstat/crunchstat.go		patch \| blob \| history
lib/crunchstat/crunchstat_test.go		patch \| blob \| history
lib/ctrlctx/auth.go	[new file with mode: 0644]	patch \| blob
lib/ctrlctx/auth_test.go	[new file with mode: 0644]	patch \| blob
lib/ctrlctx/db.go		patch \| blob \| history
lib/diagnostics/cmd.go		patch \| blob \| history
lib/dispatchcloud/dispatcher.go		patch \| blob \| history
lib/dispatchcloud/dispatcher_test.go		patch \| blob \| history
lib/dispatchcloud/node_size.go		patch \| blob \| history
lib/dispatchcloud/node_size_test.go		patch \| blob \| history
lib/install/deps.go		patch \| blob \| history
lib/lsf/dispatch.go		patch \| blob \| history
lib/lsf/dispatch_test.go		patch \| blob \| history
lib/pam/testclient.go		patch \| blob \| history
sdk/cwl/arvados_cwl/__init__.py		patch \| blob \| history
sdk/cwl/arvados_cwl/arvcontainer.py		patch \| blob \| history
sdk/cwl/arvados_cwl/arvworkflow.py		patch \| blob \| history
sdk/cwl/arvados_cwl/context.py		patch \| blob \| history
sdk/cwl/arvados_cwl/executor.py		patch \| blob \| history
sdk/cwl/arvados_cwl/fsaccess.py		patch \| blob \| history
sdk/cwl/arvados_cwl/http.py		patch \| blob \| history
sdk/cwl/arvados_cwl/pathmapper.py		patch \| blob \| history
sdk/cwl/arvados_cwl/runner.py		patch \| blob \| history
sdk/cwl/setup.py		patch \| blob \| history
sdk/cwl/tests/19678-name-id.cwl	[new file with mode: 0644]	patch \| blob
sdk/cwl/tests/arvados-tests.yml		patch \| blob \| history
sdk/cwl/tests/collection_per_tool/collection_per_tool_wrapper.cwl	[new file with mode: 0644]	patch \| blob
sdk/cwl/tests/test_container.py		patch \| blob \| history
sdk/cwl/tests/test_http.py		patch \| blob \| history
sdk/cwl/tests/test_submit.py		patch \| blob \| history
sdk/cwl/tests/wf/expect_upload_wrapper.cwl	[new file with mode: 0644]	patch \| blob
sdk/cwl/tests/wf/expect_upload_wrapper_altname.cwl	[new file with mode: 0644]	patch \| blob
sdk/dev-jobs.dockerfile		patch \| blob \| history
sdk/go/arvados/api.go		patch \| blob \| history
sdk/go/arvados/client.go		patch \| blob \| history
sdk/go/arvados/config.go		patch \| blob \| history
sdk/go/arvados/container.go		patch \| blob \| history
sdk/go/arvados/duration.go		patch \| blob \| history
sdk/go/arvados/duration_test.go		patch \| blob \| history
sdk/go/arvados/fs_collection.go		patch \| blob \| history
sdk/go/arvados/log.go		patch \| blob \| history
sdk/go/arvados/vocabulary.go		patch \| blob \| history
sdk/go/arvados/vocabulary_test.go		patch \| blob \| history
sdk/go/arvadostest/api.go		patch \| blob \| history
sdk/go/arvadostest/db.go		patch \| blob \| history
sdk/go/health/aggregator.go		patch \| blob \| history
sdk/go/health/aggregator_test.go		patch \| blob \| history
sdk/go/keepclient/block_cache.go		patch \| blob \| history
sdk/perl/.gitignore	[deleted file]	patch \| blob \| history
sdk/perl/Makefile.PL	[deleted file]	patch \| blob \| history
sdk/perl/lib/Arvados.pm	[deleted file]	patch \| blob \| history
sdk/perl/lib/Arvados/Request.pm	[deleted file]	patch \| blob \| history
sdk/perl/lib/Arvados/ResourceAccessor.pm	[deleted file]	patch \| blob \| history
sdk/perl/lib/Arvados/ResourceMethod.pm	[deleted file]	patch \| blob \| history
sdk/perl/lib/Arvados/ResourceProxy.pm	[deleted file]	patch \| blob \| history
sdk/perl/lib/Arvados/ResourceProxyList.pm	[deleted file]	patch \| blob \| history
sdk/python/README.rst		patch \| blob \| history
sdk/python/arvados/collection.py		patch \| blob \| history
sdk/python/arvados/diskcache.py	[new file with mode: 0644]	patch \| blob
sdk/python/arvados/errors.py		patch \| blob \| history
sdk/python/arvados/keep.py		patch \| blob \| history
sdk/python/arvados/retry.py		patch \| blob \| history
sdk/python/setup.py		patch \| blob \| history
sdk/python/tests/arvados_testutil.py		patch \| blob \| history
sdk/python/tests/run_test_server.py		patch \| blob \| history
sdk/python/tests/test_collections.py		patch \| blob \| history
sdk/python/tests/test_keep_client.py		patch \| blob \| history
sdk/ruby/lib/arvados.rb		patch \| blob \| history
sdk/ruby/lib/arvados/keep.rb		patch \| blob \| history
services/api/Gemfile.lock		patch \| blob \| history
services/api/app/models/api_client.rb		patch \| blob \| history
services/api/app/models/arvados_model.rb		patch \| blob \| history
services/api/app/models/container.rb		patch \| blob \| history
services/api/app/models/user.rb		patch \| blob \| history
services/api/lib/tasks/delete_old_container_logs.rake		patch \| blob \| history
services/api/test/fixtures/containers.yml		patch \| blob \| history
services/api/test/functional/arvados/v1/collections_controller_test.rb		patch \| blob \| history
services/api/test/integration/users_test.rb		patch \| blob \| history
services/api/test/tasks/delete_old_container_logs_test.rb	[deleted file]	patch \| blob \| history
services/api/test/unit/container_request_test.rb		patch \| blob \| history
services/api/test/unit/container_test.rb		patch \| blob \| history
services/crunch-dispatch-slurm/crunch-dispatch-slurm.go		patch \| blob \| history
services/crunchstat/crunchstat.go		patch \| blob \| history
services/fuse/README.rst		patch \| blob \| history
services/fuse/arvados_fuse/command.py		patch \| blob \| history
services/fuse/setup.py		patch \| blob \| history
services/fuse/tests/mount_test_base.py		patch \| blob \| history
services/fuse/tests/test_mount.py		patch \| blob \| history
services/keep-balance/balance.go		patch \| blob \| history
services/keep-balance/balance_run_test.go		patch \| blob \| history
services/keep-balance/integration_test.go		patch \| blob \| history
services/keep-balance/main.go		patch \| blob \| history
services/keep-balance/server.go		patch \| blob \| history
services/keepstore/s3_volume.go		patch \| blob \| history
services/keepstore/s3aws_volume.go		patch \| blob \| history
services/login-sync/arvados-login-sync.gemspec		patch \| blob \| history
services/login-sync/bin/arvados-login-sync		patch \| blob \| history
tools/arvbox/bin/arvbox		patch \| blob \| history
tools/arvbox/lib/arvbox/docker/common.sh		patch \| blob \| history
tools/arvbox/lib/arvbox/docker/service/ready/run-service		patch \| blob \| history
tools/arvbox/lib/arvbox/docker/service/sdk/run-service		patch \| blob \| history
tools/salt-install/config_examples/multi_host/aws/pillars/nginx_controller_configuration.sls		patch \| blob \| history
tools/salt-install/config_examples/single_host/multiple_hostnames/pillars/nginx_controller_configuration.sls		patch \| blob \| history
tools/salt-install/config_examples/single_host/single_hostname/pillars/nginx_controller_configuration.sls		patch \| blob \| history
tools/user-activity/arvados_user_activity/main.py		patch \| blob \| history