# Help text. Every line goes to stderr (>&2), so it never mixes with stdout.
# First the synopsis, the positional argument and the supported options.
7 echo >&2 "usage: $0 [options] <identifier>"
9 echo >&2 " <identifier> Arvados cluster name"
11 echo >&2 "$0 options:"
12 echo >&2 " -d, --debug Enable debug output"
13 echo >&2 " -h, --help Display this help and exit"
# Then the API token requirements, printed as an example create_system_auth
# invocation. The scopes listed are GET on virtual_machines, keep_services,
# groups, links and collections, plus POST on collections and links.
# Single quotes keep the backslashes and double quotes literal in the output.
15 echo >&2 "Note: this script requires an arvados token created with these permissions:"
16 echo >&2 ' arv api_client_authorization create_system_auth \'
17 echo >&2 ' --scopes "[\"GET /arvados/v1/virtual_machines\",'
18 echo >&2 ' \"GET /arvados/v1/keep_services\",'
19 echo >&2 ' \"GET /arvados/v1/keep_services/\",'
20 echo >&2 ' \"GET /arvados/v1/groups\",'
21 echo >&2 ' \"GET /arvados/v1/groups/\",'
22 echo >&2 ' \"GET /arvados/v1/links\",'
23 echo >&2 ' \"GET /arvados/v1/collections\",'
24 echo >&2 ' \"POST /arvados/v1/collections\",'
25 echo >&2 ' \"POST /arvados/v1/links\"]"'
29 # NOTE: This requires GNU getopt (part of the util-linux package on Debian-based distros).
# Abort with a hint when the command just before this check failed.
# NOTE(review): that command is not visible here; presumably it is the getopt
# call the NOTE above refers to -- confirm.
34 if [ $? != 0 ] ; then echo "Use -h for help"; exit 1 ; fi
35 # Note the quotes around `$TEMP': they are essential!
# The cluster identifier is the only positional argument (see the usage text);
# an empty value is caught here. How it is handled is not visible --
# presumably usage is printed and the script exits; TODO confirm.
58 if [[ "$IDENTIFIER" == '' ]]; then
69 let endtime="$(now) + 600"
70 while [ "$endtime" -gt "$(now)" ]; do
71 puppet agent --test --detailed-exitcodes
73 if [ 0 = "$agent_exitcode" ] || [ 2 = "$agent_exitcode" ]; then
79 exit ${agent_exitcode:-99}
83 date=`date +'%Y-%m-%d %H:%M:%S'`
# run_puppet: execute the shell snippet held in $PUPPET_AGENT on a remote node
# via ssh (root login, port 2222, 5 second connect timeout, host key checking
# disabled) and hand the resulting exit code back to the caller.
#
# Callers in this script invoke it as: run_puppet <node> <name-of-result-var>
# The lines that copy the arguments into $node and $return_var, and that set
# up $TMP_FILE, are not visible here -- TODO confirm against the full file.
#
# Globals read: DEBUG, PUPPET_AGENT, TMP_FILE
# Result: the exit code is stored (via eval) in the variable named by
# $return_var.
87 function run_puppet() {
91 title "Running puppet on $node"
# DEBUG other than "0": show the remote output live and keep a copy in
# $TMP_FILE through tee (only stdout is piped).
93 if [[ "$DEBUG" != "0" ]]; then
94 ssh -t -p2222 -o "StrictHostKeyChecking no" -o "ConnectTimeout 5" root@$node -C bash -c "'$PUPPET_AGENT'" | tee $TMP_FILE
# Otherwise: stay quiet and capture stdout and stderr together in $TMP_FILE.
96 ssh -t -p2222 -o "StrictHostKeyChecking no" -o "ConnectTimeout 5" root@$node -C bash -c "'$PUPPET_AGENT'" > $TMP_FILE 2>&1
# Element 0 of PIPESTATUS is intended to be the status of ssh, not of tee in
# the debug pipeline.
99 ECODE=${PIPESTATUS[0]}
100 RESULT=$(cat $TMP_FILE)
# Report an error only when none of the tolerated outcomes applies: ssh
# failure (255), a puppet run already in progress, puppet exit code 2, or a
# clean exit (0).
102 if [[ "$ECODE" != "255" && ! ("$RESULT" =~ 'already in progress') && "$ECODE" != "2" && "$ECODE" != "0" ]]; then
103 # Ssh exits 255 if the connection timed out. Just ignore that.
104 # Puppet exits 2 if there are changes. For real!
105 # Puppet prints 'Notice: Run of Puppet configuration client already in progress' if another puppet process
106 # was already running
107 echo "ERROR running puppet on $node: exit code $ECODE"
# In quiet mode the output has not been shown yet, so it is announced here
# (the line that actually prints it is not visible).
108 if [[ "$DEBUG" == "0" ]]; then
109 title "Command output follows:"
113 if [[ "$ECODE" == "255" ]]; then
114 title "Connection timed out"
# Exit code 2 gets special treatment; the body is not visible here.
# NOTE(review): presumably it is normalised to success, since callers add
# ECODE to their error sums -- confirm.
117 if [[ "$ECODE" == "2" ]]; then
# Assign the exit code to the caller-named variable.
121 eval "$return_var=$ECODE"
# run_command: execute an arbitrary command line on a remote node via ssh
# (root login, port 2222, 5 second connect timeout, host key checking
# disabled) and hand the resulting exit code back to the caller.
#
# Callers in this script invoke it as:
#   run_command <node> <name-of-result-var> "<command>"
# The lines that copy the arguments into $node, $return_var and $command, and
# the line that sets ECODE after the ssh call, are not visible here -- TODO
# confirm against the full file.
#
# Globals read: DEBUG, TMP_FILE
# Result: the exit code is stored (via eval) in the variable named by
# $return_var.
124 function run_command() {
129 title "Running '$command' on $node"
# DEBUG other than "0": show the remote output live and keep a copy in
# $TMP_FILE through tee (only stdout is piped).
131 if [[ "$DEBUG" != "0" ]]; then
132 ssh -t -p2222 -o "StrictHostKeyChecking no" -o "ConnectTimeout 5" root@$node -C "$command" | tee $TMP_FILE
# Otherwise: stay quiet and capture stdout and stderr together in $TMP_FILE.
134 ssh -t -p2222 -o "StrictHostKeyChecking no" -o "ConnectTimeout 5" root@$node -C "$command" > $TMP_FILE 2>&1
138 RESULT=$(cat $TMP_FILE)
# Anything other than success (0) or an ssh-level failure (255) is reported
# as an error.
140 if [[ "$ECODE" != "255" && "$ECODE" != "0" ]]; then
141 # Ssh exits 255 if the connection timed out. Just ignore that, it's possible that this node is
142 # a shell node that is down.
143 title "ERROR running command on $node: exit code $ECODE"
# In quiet mode the output has not been shown yet, so it is announced here
# (the line that actually prints it is not visible).
144 if [[ "$DEBUG" == "0" ]]; then
145 title "Command output follows:"
149 if [[ "$ECODE" == "255" ]]; then
150 title "Connection timed out"
# Assign the exit code to the caller-named variable.
154 eval "$return_var=$ECODE"
# Step: API server. Run puppet on <identifier>.arvadosapi.com, then the API
# server upgrade script, adding each exit code to SUM_ECODE.
# (The initialisation of SUM_ECODE is not visible here.)
157 title "Updating API server"
159 run_puppet $IDENTIFIER.arvadosapi.com ECODE
160 SUM_ECODE=$(($SUM_ECODE + $ECODE))
161 run_command $IDENTIFIER.arvadosapi.com ECODE "/usr/local/rvm/bin/rvm-exec /usr/local/bin/arvados-api-server-upgrade.sh"
162 SUM_ECODE=$(($SUM_ECODE + $ECODE))
# Clusters other than c97qk additionally get the mailchimp plugin reinstalled,
# but only if the package is already installed (dpkg -L succeeds). The
# trailing "|| echo" makes the remote command line succeed even when the
# package is absent or the reinstall fails.
163 if [ ! "$IDENTIFIER" = "c97qk" ]
165 run_command $IDENTIFIER.arvadosapi.com ECODE "dpkg -L arvados-mailchimp-plugin 2>/dev/null && apt-get install arvados-mailchimp-plugin --reinstall || echo"
166 SUM_ECODE=$(($SUM_ECODE + $ECODE))
# A non-zero sum marks the whole step as failed and is folded into the
# script-wide EXITCODE.
169 if [[ "$SUM_ECODE" != "0" ]]; then
170 title "ERROR: Updating API server FAILED"
171 EXITCODE=$(($EXITCODE + $SUM_ECODE))
# Step: credentials. Source the per-cluster settings file
# $HOME/.config/arvados/<identifier>.arvadosapi.com.conf when it exists;
# when it does not, only a warning is printed.
175 title "Loading ARVADOS_API_HOST and ARVADOS_API_TOKEN"
176 if [[ -f "$HOME/.config/arvados/$IDENTIFIER.arvadosapi.com.conf" ]]; then
177 . $HOME/.config/arvados/$IDENTIFIER.arvadosapi.com.conf
179 title "WARNING: $HOME/.config/arvados/$IDENTIFIER.arvadosapi.com.conf not found."
# Whatever their origin (settings file or pre-existing environment), both
# values must be non-empty for the API calls that follow.
181 if [[ "$ARVADOS_API_HOST" == "" ]] || [[ "$ARVADOS_API_TOKEN" == "" ]]; then
182 title "ERROR: ARVADOS_API_HOST and/or ARVADOS_API_TOKEN environment variables are not set."
# Step: standard Docker images. Find the "Arvados Standard Docker Images"
# project, creating it when absent, then make sure the arvados/jobs image
# matching the deployed git commit has been uploaded to it.
186 title "Locating Arvados Standard Docker images project"
# Filter: exact project name, owned by <identifier>-tpzed-000000000000000.
188 JSON_FILTER="[[\"name\", \"=\", \"Arvados Standard Docker Images\"], [\"owner_uuid\", \"=\", \"$IDENTIFIER-tpzed-000000000000000\"]]"
# --format=uuid makes arv print only the uuid(s), so an empty result means
# "no such project".
189 DOCKER_IMAGES_PROJECT=`ARVADOS_API_HOST=$ARVADOS_API_HOST ARVADOS_API_TOKEN=$ARVADOS_API_TOKEN arv --format=uuid group list --filters="$JSON_FILTER"`
191 if [[ "$DOCKER_IMAGES_PROJECT" == "" ]]; then
192 title "Warning: Arvados Standard Docker Images project not found. Creating it."
# Create the project, then a can_read permission link from
# <identifier>-j7d0g-fffffffffffffff to the new project.
194 DOCKER_IMAGES_PROJECT=`ARVADOS_API_HOST=$ARVADOS_API_HOST ARVADOS_API_TOKEN=$ARVADOS_API_TOKEN arv --format=uuid group create --group "{\"owner_uuid\":\"$IDENTIFIER-tpzed-000000000000000\", \"name\":\"Arvados Standard Docker Images\", \"group_class\":\"project\"}"`
195 ARVADOS_API_HOST=$ARVADOS_API_HOST ARVADOS_API_TOKEN=$ARVADOS_API_TOKEN arv link create --link "{\"tail_uuid\":\"$IDENTIFIER-j7d0g-fffffffffffffff\", \"head_uuid\":\"$DOCKER_IMAGES_PROJECT\", \"link_class\":\"permission\", \"name\":\"can_read\" }"
# NOTE(review): this tests only the status of the link creation directly
# above; a failed group create is not checked separately.
196 if [[ "$?" != "0" ]]; then
197 title "ERROR: could not create standard Docker images project Please create it, cf. http://doc.arvados.org/install/create-standard-objects.html"
202 title "Found Arvados Standard Docker Images project with uuid $DOCKER_IMAGES_PROJECT"
# The commit to install is read over ssh from a version file on the host
# named by $IDENTIFIER.
203 GIT_COMMIT=`ssh -o "StrictHostKeyChecking no" $IDENTIFIER cat /usr/local/arvados/src/git-commit.version`
205 if [[ "$?" != "0" ]] || [[ "$GIT_COMMIT" == "" ]]; then
206 title "ERROR: unable to get arvados/jobs Docker image git revision"
209 title "Found git commit for arvados/jobs Docker image: $GIT_COMMIT"
# List the Docker images known to Keep (via the shell node) and look for the
# commit in that listing. run_command sits on the left of a pipe, so it runs
# in a subshell: the ECODE it assigns is not visible afterwards, and only the
# grep status decides the branch below.
212 run_command shell.$IDENTIFIER ECODE "ARVADOS_API_HOST=$ARVADOS_API_HOST ARVADOS_API_TOKEN=$ARVADOS_API_TOKEN /usr/local/rvm/bin/rvm-exec default arv keep docker" |grep -q $GIT_COMMIT
214 if [[ "$?" == "0" ]]; then
215 title "Found latest arvados/jobs Docker image, nothing to upload"
217 title "Installing latest arvados/jobs Docker image"
# Pull arvados/jobs at tag $GIT_COMMIT and store it in the project found or
# created above.
218 ssh -o "StrictHostKeyChecking no" shell.$IDENTIFIER "ARVADOS_API_HOST=$ARVADOS_API_HOST ARVADOS_API_TOKEN=$ARVADOS_API_TOKEN /usr/local/rvm/bin/rvm-exec default arv keep docker --pull --project-uuid=$DOCKER_IMAGES_PROJECT arvados/jobs $GIT_COMMIT"
# NOTE(review): the message below says 'git pull', but the command that
# failed is the "arv keep docker --pull" call above -- consider rewording.
219 if [[ "$?" -ne 0 ]]; then
220 title "'git pull' failed exiting..."
# Step: node inventory. Ask the API for all virtual machines and all keep
# services, and use jq (-r: raw strings, no JSON quoting) to reduce each
# listing to its host names: .hostname for VMs, .service_host for keep
# services.
225 title "Gathering list of shell and Keep nodes"
226 SHELL_NODES=`ARVADOS_API_HOST=$ARVADOS_API_HOST ARVADOS_API_TOKEN=$ARVADOS_API_TOKEN arv virtual_machine list |jq .items[].hostname -r`
227 KEEP_NODES=`ARVADOS_API_HOST=$ARVADOS_API_HOST ARVADOS_API_TOKEN=$ARVADOS_API_TOKEN arv keep_service list |jq .items[].service_host -r`
# Step: workbench. Exit codes are accumulated in SUM_ECODE, as in the API
# server step (any reset of SUM_ECODE before this step is not visible here).
229 title "Updating workbench"
# Compare the 4th space-separated field of the `host` output for the
# workbench name and for the API host (presumably the resolved address --
# TODO confirm for multi-line or IPv6 answers). A difference means workbench
# lives on its own machine.
231 if [[ `host workbench.$ARVADOS_API_HOST |cut -f4 -d' '` != `host $ARVADOS_API_HOST |cut -f4 -d' '` ]]; then
232 # Workbench runs on a separate host. We need to run puppet there too.
233 run_puppet workbench.$IDENTIFIER ECODE
234 SUM_ECODE=$(($SUM_ECODE + $ECODE))
# Run the workbench upgrade script on the workbench host.
237 run_command workbench.$IDENTIFIER ECODE "/usr/local/rvm/bin/rvm-exec /usr/local/bin/arvados-workbench-upgrade.sh"
238 SUM_ECODE=$(($SUM_ECODE + $ECODE))
# A non-zero sum marks the whole step as failed and is folded into the
# script-wide EXITCODE.
240 if [[ "$SUM_ECODE" != "0" ]]; then
241 title "ERROR: Updating workbench FAILED"
242 EXITCODE=$(($EXITCODE + $SUM_ECODE))
# Step: remaining nodes. Run puppet on the fixed names "manage" and
# "switchyard" plus every shell and Keep node gathered earlier. The lists are
# expanded unquoted on purpose so that each host name becomes its own word.
246 for n in manage switchyard $SHELL_NODES $KEEP_NODES; do
# Names that already end in the API host are distinguished from short names,
# which get the API host appended.
# NOTE(review): the right-hand side of =~ is an unquoted regex, so the dots
# in $ARVADOS_API_HOST match any character.
248 if [[ $n =~ $ARVADOS_API_HOST$ ]]; then
249 # e.g. keep.qr1hi.arvadosapi.com
253 node=$n.$ARVADOS_API_HOST
# Drop a trailing ".arvadosapi.com" to obtain the name used for ssh.
257 node=${node%.arvadosapi.com}
259 title "Updating $node"
260 run_puppet $node ECODE
# A failure on one node is recorded in EXITCODE.
261 if [[ "$ECODE" != "0" ]]; then
262 title "ERROR: Updating $node node FAILED: exit code $ECODE"
263 EXITCODE=$(($EXITCODE + $ECODE))