X-Git-Url: https://git.arvados.org/arvados.git/blobdiff_plain/8e13c05a464c8d9a3ac543f706f814a7a02d249f..1d068f13d0c9148dcee20c7802bf61956f8e3267:/tools/salt-install/provision.sh diff --git a/tools/salt-install/provision.sh b/tools/salt-install/provision.sh index ec64a97b8b..a93899a61a 100755 --- a/tools/salt-install/provision.sh +++ b/tools/salt-install/provision.sh @@ -10,6 +10,7 @@ # # vagrant up +set -eu set -o pipefail # capture the directory that the script is running from @@ -25,13 +26,14 @@ usage() { echo >&2 " -t, --test Test installation running a CWL workflow" echo >&2 " -r, --roles List of Arvados roles to apply to the host, comma separated" echo >&2 " Possible values are:" - echo >&2 " api" + echo >&2 " balancer" echo >&2 " controller" echo >&2 " dispatcher" echo >&2 " keepproxy" echo >&2 " keepbalance" echo >&2 " keepstore" echo >&2 " keepweb" + echo >&2 " monitoring" echo >&2 " shell" echo >&2 " webshell" echo >&2 " websocket" @@ -41,13 +43,13 @@ usage() { echo >&2 " -h, --help Display this help and exit" echo >&2 " --dump-config Dumps the pillars and states to a directory" echo >&2 " This parameter does not perform any installation at all. It's" - echo >&2 " intended to give you a parsed sot of configuration files so" + echo >&2 " intended to give you a parsed set of configuration files so" echo >&2 " you can inspect them or use them in you Saltstack infrastructure." echo >&2 " It" echo >&2 " - parses the pillar and states templates," echo >&2 " - downloads the helper formulas with their desired versions," echo >&2 " - prepares the 'top.sls' files both for pillars and states" - echo >&2 " for the selected role/s" + echo >&2 " for the selected role(s)" echo >&2 " - writes the resulting files into " echo >&2 " -v, --vagrant Run in vagrant and use the /vagrant shared dir" echo >&2 " --development Run in dev mode, using snakeoil certs" @@ -108,12 +110,12 @@ arguments() { for i in ${2//,/ } do # Verify the role exists - if [[ ! "database,api,controller,keepstore,websocket,keepweb,workbench2,webshell,keepbalance,keepproxy,shell,workbench,dispatcher" == *"$i"* ]]; then + if [[ ! "database,balancer,controller,keepstore,websocket,keepweb,workbench2,webshell,keepbalance,keepproxy,shell,workbench,dispatcher,monitoring" == *"$i"* ]]; then echo "The role '${i}' is not a valid role" usage exit 1 fi - ROLES="${ROLES} ${i}" + ROLES="${ROLES:-} ${i}" done shift 2 ;; @@ -141,22 +143,94 @@ copy_custom_cert() { cert_dir=${1} cert_name=${2} - mkdir -p /srv/salt/certs + mkdir -p --mode=0700 /srv/salt/certs if [ -f ${cert_dir}/${cert_name}.crt ]; then - cp -v ${cert_dir}/${cert_name}.crt /srv/salt/certs/arvados-${cert_name}.pem + install --mode=0600 ${cert_dir}/${cert_name}.crt /srv/salt/certs/arvados-${cert_name}.pem else echo "${cert_dir}/${cert_name}.crt does not exist. Exiting" exit 1 fi if [ -f ${cert_dir}/${cert_name}.key ]; then - cp -v ${cert_dir}/${cert_name}.key /srv/salt/certs/arvados-${cert_name}.key + install --mode=0600 ${cert_dir}/${cert_name}.key /srv/salt/certs/arvados-${cert_name}.key else echo "${cert_dir}/${cert_name}.key does not exist. Exiting" exit 1 fi } +apply_var_substitutions() { + local SRCFILE=$1 + local DSTFILE=$2 + sed "s#__ANONYMOUS_USER_TOKEN__#${ANONYMOUS_USER_TOKEN}#g; + s#__BLOB_SIGNING_KEY__#${BLOB_SIGNING_KEY}#g; + s#__CONTROLLER_EXT_SSL_PORT__#${CONTROLLER_EXT_SSL_PORT}#g; + s#__CLUSTER__#${CLUSTER}#g; + s#__DOMAIN__#${DOMAIN}#g; + s#__HOSTNAME_EXT__#${HOSTNAME_EXT}#g; + s#__IP_INT__#${IP_INT}#g; + s#__INITIAL_USER_EMAIL__#${INITIAL_USER_EMAIL}#g; + s#__INITIAL_USER_PASSWORD__#${INITIAL_USER_PASSWORD}#g; + s#__INITIAL_USER__#${INITIAL_USER}#g; + s#__LE_AWS_REGION__#${LE_AWS_REGION:-}#g; + s#__LE_AWS_SECRET_ACCESS_KEY__#${LE_AWS_SECRET_ACCESS_KEY:-}#g; + s#__LE_AWS_ACCESS_KEY_ID__#${LE_AWS_ACCESS_KEY_ID:-}#g; + s#__DATABASE_NAME__#${DATABASE_NAME}#g; + s#__DATABASE_USER__#${DATABASE_USER}#g; + s#__DATABASE_PASSWORD__#${DATABASE_PASSWORD}#g; + s#__DATABASE_INT_IP__#${DATABASE_INT_IP:-}#g; + s#__DATABASE_EXTERNAL_SERVICE_HOST_OR_IP__#${DATABASE_EXTERNAL_SERVICE_HOST_OR_IP:-}#g; + s#__DATABASE_POSTGRESQL_VERSION__#${DATABASE_POSTGRESQL_VERSION}#g; + s#__KEEPWEB_EXT_SSL_PORT__#${KEEPWEB_EXT_SSL_PORT}#g; + s#__KEEP_EXT_SSL_PORT__#${KEEP_EXT_SSL_PORT}#g; + s#__MANAGEMENT_TOKEN__#${MANAGEMENT_TOKEN}#g; + s#__RELEASE__#${RELEASE}#g; + s#__SYSTEM_ROOT_TOKEN__#${SYSTEM_ROOT_TOKEN}#g; + s#__VERSION__#${VERSION}#g; + s#__WEBSHELL_EXT_SSL_PORT__#${WEBSHELL_EXT_SSL_PORT}#g; + s#__WEBSOCKET_EXT_SSL_PORT__#${WEBSOCKET_EXT_SSL_PORT}#g; + s#__WORKBENCH1_EXT_SSL_PORT__#${WORKBENCH1_EXT_SSL_PORT}#g; + s#__WORKBENCH2_EXT_SSL_PORT__#${WORKBENCH2_EXT_SSL_PORT}#g; + s#__CLUSTER_INT_CIDR__#${CLUSTER_INT_CIDR}#g; + s#__CONTROLLER_INT_IP__#${CONTROLLER_INT_IP}#g; + s#__WEBSOCKET_INT_IP__#${WEBSOCKET_INT_IP}#g; + s#__KEEP_INT_IP__#${KEEP_INT_IP}#g; + s#__KEEPSTORE0_INT_IP__#${KEEPSTORE0_INT_IP}#g; + s#__KEEPWEB_INT_IP__#${KEEPWEB_INT_IP}#g; + s#__WEBSHELL_INT_IP__#${WEBSHELL_INT_IP}#g; + s#__SHELL_INT_IP__#${SHELL_INT_IP}#g; + s#__WORKBENCH1_INT_IP__#${WORKBENCH1_INT_IP}#g; + s#__WORKBENCH2_INT_IP__#${WORKBENCH2_INT_IP}#g; + s#__WORKBENCH_SECRET_KEY__#${WORKBENCH_SECRET_KEY}#g; + s#__SSL_KEY_ENCRYPTED__#${SSL_KEY_ENCRYPTED}#g; + s#__SSL_KEY_AWS_REGION__#${SSL_KEY_AWS_REGION:-}#g; + s#__SSL_KEY_AWS_SECRET_NAME__#${SSL_KEY_AWS_SECRET_NAME}#g; + s#__CONTROLLER_MAX_WORKERS__#${CONTROLLER_MAX_WORKERS:-}#g; + s#__CONTROLLER_MAX_QUEUED_REQUESTS__#${CONTROLLER_MAX_QUEUED_REQUESTS:-128}#g; + s#__MONITORING_USERNAME__#${MONITORING_USERNAME}#g; + s#__MONITORING_EMAIL__#${MONITORING_EMAIL}#g; + s#__MONITORING_PASSWORD__#${MONITORING_PASSWORD}#g; + s#__DISPATCHER_SSH_PRIVKEY__#${DISPATCHER_SSH_PRIVKEY//$'\n'/\\n}#g; + s#__ENABLE_BALANCER__#${ENABLE_BALANCER}#g; + s#__DISABLED_CONTROLLER__#${DISABLED_CONTROLLER}#g; + s#__BALANCER_NODENAME__#${ROLE2NODES['balancer']:-}#g; + s#__PROMETHEUS_NODENAME__#${ROLE2NODES['monitoring']:-}#g; + s#__PROMETHEUS_DATA_RETENTION_TIME__#${PROMETHEUS_DATA_RETENTION_TIME:-15d}#g; + s#__CONTROLLER_NODES__#${ROLE2NODES['controller']:-}#g; + s#__NODELIST__#${NODELIST}#g; + s#__DISPATCHER_INT_IP__#${DISPATCHER_INT_IP}#g; + s#__KEEPBALANCE_INT_IP__#${KEEPBALANCE_INT_IP}#g; + s#__COMPUTE_AMI__#${COMPUTE_AMI:-}#g; + s#__COMPUTE_SG__#${COMPUTE_SG:-}#g; + s#__COMPUTE_SUBNET__#${COMPUTE_SUBNET:-}#g; + s#__COMPUTE_AWS_REGION__#${COMPUTE_AWS_REGION:-}#g; + s#__COMPUTE_USER__#${COMPUTE_USER:-}#g; + s#__KEEP_AWS_S3_BUCKET__#${KEEP_AWS_S3_BUCKET:-}#g; + s#__KEEP_AWS_IAM_ROLE__#${KEEP_AWS_IAM_ROLE:-}#g; + s#__KEEP_AWS_REGION__#${KEEP_AWS_REGION:-}#g" \ + "${SRCFILE}" > "${DSTFILE}" +} + DEV_MODE="no" CONFIG_FILE="${SCRIPT_DIR}/local.params" CONFIG_DIR="local_config_dir" @@ -189,7 +263,9 @@ WORKBENCH2_EXT_SSL_PORT=3001 SSL_MODE="self-signed" USE_LETSENCRYPT_ROUTE53="no" -CUSTOM_CERTS_DIR="${SCRIPT_DIR}/certs" +CUSTOM_CERTS_DIR="${SCRIPT_DIR}/local_config_dir/certs" + +GRAFANA_DASHBOARDS_DIR="${SCRIPT_DIR}/local_config_dir/dashboards" ## These are ARVADOS-related parameters # For a stable release, change RELEASE "production" and VERSION to the @@ -206,35 +282,43 @@ VERSION="latest" # ARVADOS_TAG="2.2.0" # BRANCH="main" +# We pin the salt version to avoid potential incompatibilities when a new +# stable version is released. +SALT_VERSION="3004" + # Other formula versions we depend on -POSTGRES_TAG="v0.44.0" +#POSTGRES_TAG="v0.44.0" +#POSTGRES_URL="https://github.com/saltstack-formulas/postgres-formula.git" +POSTGRES_TAG="0.45.0-bugfix327" +POSTGRES_URL="https://github.com/arvados/postgres-formula.git" NGINX_TAG="v2.8.1" DOCKER_TAG="v2.4.2" LOCALE_TAG="v0.3.4" LETSENCRYPT_TAG="v2.1.0" +LOGROTATE_TAG="v0.14.0" +PROMETHEUS_TAG="v5.6.5" +GRAFANA_TAG="v3.1.3" # Salt's dir DUMP_SALT_CONFIG_DIR="" ## states S_DIR="/srv/salt" +STATES_TOP=${S_DIR}/top.sls ## formulas F_DIR="/srv/formulas" ## pillars P_DIR="/srv/pillars" +PILLARS_TOP=${P_DIR}/top.sls ## tests T_DIR="/tmp/cluster_tests" arguments ${@} -if [ -s ${CONFIG_FILE} ]; then - source ${CONFIG_FILE} -else - echo >&2 "You don't seem to have a config file with initial values." - echo >&2 "Please create a '${CONFIG_FILE}' file as described in" - echo >&2 " * https://doc.arvados.org/install/salt-single-host.html#single_host, or" - echo >&2 " * https://doc.arvados.org/install/salt-multi-host.html#multi_host_multi_hostnames" - exit 1 -fi +declare -A NODES +declare -A ROLE2NODES +declare NODELIST + +source common.sh if [ ! -d ${CONFIG_DIR} ]; then echo >&2 "You don't seem to have a config directory with pillars and states." @@ -244,26 +328,26 @@ if [ ! -d ${CONFIG_DIR} ]; then exit 1 fi -if grep -q 'fixme_or_this_wont_work' ${CONFIG_FILE} ; then - echo >&2 "The config file ${CONFIG_FILE} has some parameters that need to be modified." +if grep -rni 'fixme' ${CONFIG_FILE}.secrets ${CONFIG_FILE} ${CONFIG_DIR} ; then + echo >&2 "The config files has some parameters that need to be modified." echo >&2 "Please, fix them and re-run the provision script." exit 1 fi if ! grep -qE '^[[:alnum:]]{5}$' <<<${CLUSTER} ; then - echo >&2 "ERROR: must be exactly 5 alphanumeric characters long" + echo >&2 "ERROR: must be exactly 5 lowercase alphanumeric characters long" echo >&2 "Fix the cluster name in the 'local.params' file and re-run the provision script" exit 1 fi # Only used in single_host/single_name deploys -if [ ! -z "${HOSTNAME_EXT}" ] ; then +if [ ! -z "${HOSTNAME_EXT:-}" ] ; then # We need to add some extra control vars to manage a single certificate vs. multiple USE_SINGLE_HOSTNAME="yes" # Make sure that the value configured as IP_INT is a real IP on the system. # If we don't error out early here when there is a mismatch, the formula will # fail with hard to interpret nginx errors later on. - ip addr list |grep -q " ${IP_INT}/" + ip addr list |grep "${IP_INT}/" >/dev/null if [[ $? -ne 0 ]]; then echo "Unable to find the IP_INT address '${IP_INT}' on the system, please correct the value in local.params. Exiting..." exit 1 @@ -272,7 +356,7 @@ else USE_SINGLE_HOSTNAME="no" # We set this variable, anyway, so sed lines do not fail and we don't need to add more # conditionals - HOSTNAME_EXT="${CLUSTER}.${DOMAIN}" + HOSTNAME_EXT="${DOMAIN}" fi if [ "${DUMP_CONFIG}" = "yes" ]; then @@ -291,7 +375,10 @@ else yum install -y curl git jq ;; "debian"|"ubuntu") - DEBIAN_FRONTEND=noninteractive apt update + # Wait 2 minutes for any apt locks to clear + # This option is supported from apt 1.9.1 and ignored in older apt versions. + # Cf. https://blog.sinjakli.co.uk/2021/10/25/waiting-for-apt-locks-without-the-hacky-bash-scripts/ + DEBIAN_FRONTEND=noninteractive apt -o DPkg::Lock::Timeout=120 update DEBIAN_FRONTEND=noninteractive apt install -y curl git jq ;; esac @@ -300,7 +387,7 @@ else echo "Salt already installed" else curl -L https://bootstrap.saltstack.com -o /tmp/bootstrap_salt.sh - sh /tmp/bootstrap_salt.sh -XdfP -x python3 + sh /tmp/bootstrap_salt.sh -XdfP -x python3 old-stable ${SALT_VERSION} /bin/systemctl stop salt-minion.service /bin/systemctl disable salt-minion.service fi @@ -326,43 +413,64 @@ mkdir -p ${S_DIR} ${F_DIR} ${P_DIR} ${T_DIR} # Get the formula and dependencies cd ${F_DIR} || exit 1 echo "Cloning formulas" -rm -rf ${F_DIR}/* || exit 1 -git clone --quiet https://github.com/saltstack-formulas/docker-formula.git ${F_DIR}/docker -( cd docker && git checkout --quiet tags/"${DOCKER_TAG}" -b "${DOCKER_TAG}" ) +test -d docker && ( cd docker && git fetch ) \ + || git clone --quiet https://github.com/saltstack-formulas/docker-formula.git ${F_DIR}/docker +( cd docker && git checkout --quiet tags/"${DOCKER_TAG}" ) echo "...locale" -git clone --quiet https://github.com/saltstack-formulas/locale-formula.git ${F_DIR}/locale -( cd locale && git checkout --quiet tags/"${LOCALE_TAG}" -b "${LOCALE_TAG}" ) +test -d locale && ( cd locale && git fetch ) \ + || git clone --quiet https://github.com/saltstack-formulas/locale-formula.git ${F_DIR}/locale +( cd locale && git checkout --quiet tags/"${LOCALE_TAG}" ) echo "...nginx" -git clone --quiet https://github.com/saltstack-formulas/nginx-formula.git ${F_DIR}/nginx -( cd nginx && git checkout --quiet tags/"${NGINX_TAG}" -b "${NGINX_TAG}" ) +test -d nginx && ( cd nginx && git fetch ) \ + || git clone --quiet https://github.com/saltstack-formulas/nginx-formula.git ${F_DIR}/nginx +( cd nginx && git checkout --quiet tags/"${NGINX_TAG}" ) echo "...postgres" -git clone --quiet https://github.com/saltstack-formulas/postgres-formula.git ${F_DIR}/postgres -( cd postgres && git checkout --quiet tags/"${POSTGRES_TAG}" -b "${POSTGRES_TAG}" ) +test -d postgres && ( cd postgres && git fetch ) \ + || git clone --quiet ${POSTGRES_URL} ${F_DIR}/postgres +( cd postgres && git checkout --quiet tags/"${POSTGRES_TAG}" ) + +echo "...prometheus" +test -d prometheus && ( cd prometheus && git fetch ) \ + || git clone --quiet https://github.com/saltstack-formulas/prometheus-formula.git ${F_DIR}/prometheus +( cd prometheus && git checkout --quiet tags/"${PROMETHEUS_TAG}" ) + +echo "...grafana" +test -d grafana && ( cd grafana && git fetch ) \ + || git clone --quiet https://github.com/saltstack-formulas/grafana-formula.git ${F_DIR}/grafana +( cd grafana && git checkout --quiet "${GRAFANA_TAG}" ) echo "...letsencrypt" -git clone --quiet https://github.com/saltstack-formulas/letsencrypt-formula.git ${F_DIR}/letsencrypt -( cd letsencrypt && git checkout --quiet tags/"${LETSENCRYPT_TAG}" -b "${LETSENCRYPT_TAG}" ) +test -d letsencrypt && ( cd letsencrypt && git fetch ) \ + || git clone --quiet https://github.com/saltstack-formulas/letsencrypt-formula.git ${F_DIR}/letsencrypt +( cd letsencrypt && git checkout --quiet tags/"${LETSENCRYPT_TAG}" ) + +echo "...logrotate" +test -d logrotate && ( cd logrotate && git fetch ) \ + || git clone --quiet https://github.com/saltstack-formulas/logrotate-formula.git ${F_DIR}/logrotate +( cd logrotate && git checkout --quiet tags/"${LOGROTATE_TAG}" ) echo "...arvados" -git clone --quiet https://git.arvados.org/arvados-formula.git ${F_DIR}/arvados +test -d arvados || git clone --quiet https://git.arvados.org/arvados-formula.git ${F_DIR}/arvados # If we want to try a specific branch of the formula -if [ "x${BRANCH}" != "x" ]; then +if [[ ! -z "${BRANCH:-}" && "x${BRANCH}" != "xmain" ]]; then ( cd ${F_DIR}/arvados && git checkout --quiet -t origin/"${BRANCH}" -b "${BRANCH}" ) -elif [ "x${ARVADOS_TAG}" != "x" ]; then -( cd ${F_DIR}/arvados && git checkout --quiet tags/"${ARVADOS_TAG}" -b "${ARVADOS_TAG}" ) +elif [ "x${ARVADOS_TAG:-}" != "x" ]; then + ( cd ${F_DIR}/arvados && git checkout --quiet tags/"${ARVADOS_TAG}" -b "${ARVADOS_TAG}" ) fi -if [ "x${VAGRANT}" = "xyes" ]; then +if [ "x${VAGRANT:-}" = "xyes" ]; then EXTRA_STATES_DIR="/home/vagrant/${CONFIG_DIR}/states" SOURCE_PILLARS_DIR="/home/vagrant/${CONFIG_DIR}/pillars" + SOURCE_TOFS_DIR="/home/vagrant/${CONFIG_DIR}/tofs" SOURCE_TESTS_DIR="/home/vagrant/${TESTS_DIR}" else EXTRA_STATES_DIR="${SCRIPT_DIR}/${CONFIG_DIR}/states" SOURCE_PILLARS_DIR="${SCRIPT_DIR}/${CONFIG_DIR}/pillars" + SOURCE_TOFS_DIR="${SCRIPT_DIR}/${CONFIG_DIR}/tofs" SOURCE_TESTS_DIR="${SCRIPT_DIR}/${TESTS_DIR}" fi @@ -377,111 +485,45 @@ if [ ! -d "${SOURCE_PILLARS_DIR}" ]; then exit 1 fi for f in $(ls "${SOURCE_PILLARS_DIR}"/*); do - sed "s#__ANONYMOUS_USER_TOKEN__#${ANONYMOUS_USER_TOKEN}#g; - s#__BLOB_SIGNING_KEY__#${BLOB_SIGNING_KEY}#g; - s#__CONTROLLER_EXT_SSL_PORT__#${CONTROLLER_EXT_SSL_PORT}#g; - s#__CLUSTER__#${CLUSTER}#g; - s#__DOMAIN__#${DOMAIN}#g; - s#__HOSTNAME_EXT__#${HOSTNAME_EXT}#g; - s#__IP_INT__#${IP_INT}#g; - s#__INITIAL_USER_EMAIL__#${INITIAL_USER_EMAIL}#g; - s#__INITIAL_USER_PASSWORD__#${INITIAL_USER_PASSWORD}#g; - s#__INITIAL_USER__#${INITIAL_USER}#g; - s#__LE_AWS_REGION__#${LE_AWS_REGION}#g; - s#__LE_AWS_SECRET_ACCESS_KEY__#${LE_AWS_SECRET_ACCESS_KEY}#g; - s#__LE_AWS_ACCESS_KEY_ID__#${LE_AWS_ACCESS_KEY_ID}#g; - s#__DATABASE_PASSWORD__#${DATABASE_PASSWORD}#g; - s#__KEEPWEB_EXT_SSL_PORT__#${KEEPWEB_EXT_SSL_PORT}#g; - s#__KEEP_EXT_SSL_PORT__#${KEEP_EXT_SSL_PORT}#g; - s#__MANAGEMENT_TOKEN__#${MANAGEMENT_TOKEN}#g; - s#__RELEASE__#${RELEASE}#g; - s#__SYSTEM_ROOT_TOKEN__#${SYSTEM_ROOT_TOKEN}#g; - s#__VERSION__#${VERSION}#g; - s#__WEBSHELL_EXT_SSL_PORT__#${WEBSHELL_EXT_SSL_PORT}#g; - s#__WEBSOCKET_EXT_SSL_PORT__#${WEBSOCKET_EXT_SSL_PORT}#g; - s#__WORKBENCH1_EXT_SSL_PORT__#${WORKBENCH1_EXT_SSL_PORT}#g; - s#__WORKBENCH2_EXT_SSL_PORT__#${WORKBENCH2_EXT_SSL_PORT}#g; - s#__CLUSTER_INT_CIDR__#${CLUSTER_INT_CIDR}#g; - s#__CONTROLLER_INT_IP__#${CONTROLLER_INT_IP}#g; - s#__WEBSOCKET_INT_IP__#${WEBSOCKET_INT_IP}#g; - s#__KEEP_INT_IP__#${KEEP_INT_IP}#g; - s#__KEEPSTORE0_INT_IP__#${KEEPSTORE0_INT_IP}#g; - s#__KEEPSTORE1_INT_IP__#${KEEPSTORE1_INT_IP}#g; - s#__KEEPWEB_INT_IP__#${KEEPWEB_INT_IP}#g; - s#__WEBSHELL_INT_IP__#${WEBSHELL_INT_IP}#g; - s#__SHELL_INT_IP__#${SHELL_INT_IP}#g; - s#__WORKBENCH1_INT_IP__#${WORKBENCH1_INT_IP}#g; - s#__WORKBENCH2_INT_IP__#${WORKBENCH2_INT_IP}#g; - s#__DATABASE_INT_IP__#${DATABASE_INT_IP}#g; - s#__WORKBENCH_SECRET_KEY__#${WORKBENCH_SECRET_KEY}#g" \ - "${f}" > "${P_DIR}"/$(basename "${f}") + apply_var_substitutions "${f}" "${P_DIR}"/$(basename "${f}") done -if [ "x${TEST}" = "xyes" ] && [ ! -d "${SOURCE_TESTS_DIR}" ]; then - echo "You requested to run tests, but ${SOURCE_TESTS_DIR} does not exist or is not a directory. Exiting." - exit 1 -fi -mkdir -p ${T_DIR} -# Replace cluster and domain name in the test files -for f in $(ls "${SOURCE_TESTS_DIR}"/*); do - FILTERS="s#__CLUSTER__#${CLUSTER}#g; - s#__CONTROLLER_EXT_SSL_PORT__#${CONTROLLER_EXT_SSL_PORT}#g; - s#__DOMAIN__#${DOMAIN}#g; - s#__IP_INT__#${IP_INT}#g; - s#__INITIAL_USER_EMAIL__#${INITIAL_USER_EMAIL}#g; - s#__INITIAL_USER_PASSWORD__#${INITIAL_USER_PASSWORD}#g - s#__INITIAL_USER__#${INITIAL_USER}#g; - s#__DATABASE_PASSWORD__#${DATABASE_PASSWORD}#g; - s#__SYSTEM_ROOT_TOKEN__#${SYSTEM_ROOT_TOKEN}#g" - if [ "$USE_SINGLE_HOSTNAME" = "yes" ]; then - FILTERS="s#__CLUSTER__.__DOMAIN__#${HOSTNAME_EXT}#g; - $FILTERS" +if [ ! -d "${SOURCE_TESTS_DIR}" ]; then + echo "WARNING: The tests directory was not copied to \"${SOURCE_TESTS_DIR}\"." + if [ "x${TEST:-}" = "xyes" ]; then + echo "WARNING: Disabling tests for this installation." fi - sed "$FILTERS" \ - "${f}" > ${T_DIR}/$(basename "${f}") -done -chmod 755 ${T_DIR}/run-test.sh - -# Replace helper state files that differ from the formula's examples -if [ -d "${SOURCE_STATES_DIR}" ]; then - mkdir -p "${F_DIR}"/extra/extra - - for f in $(ls "${SOURCE_STATES_DIR}"/*); do - sed "s#__ANONYMOUS_USER_TOKEN__#${ANONYMOUS_USER_TOKEN}#g; - s#__CLUSTER__#${CLUSTER}#g; - s#__BLOB_SIGNING_KEY__#${BLOB_SIGNING_KEY}#g; + TEST="no" +else + mkdir -p ${T_DIR} + # Replace cluster and domain name in the test files + for f in $(ls "${SOURCE_TESTS_DIR}"/*); do + FILTERS="s#__CLUSTER__#${CLUSTER}#g; s#__CONTROLLER_EXT_SSL_PORT__#${CONTROLLER_EXT_SSL_PORT}#g; s#__DOMAIN__#${DOMAIN}#g; - s#__HOSTNAME_EXT__#${HOSTNAME_EXT}#g; s#__IP_INT__#${IP_INT}#g; s#__INITIAL_USER_EMAIL__#${INITIAL_USER_EMAIL}#g; - s#__INITIAL_USER_PASSWORD__#${INITIAL_USER_PASSWORD}#g; + s#__INITIAL_USER_PASSWORD__#${INITIAL_USER_PASSWORD}#g s#__INITIAL_USER__#${INITIAL_USER}#g; s#__DATABASE_PASSWORD__#${DATABASE_PASSWORD}#g; - s#__KEEPWEB_EXT_SSL_PORT__#${KEEPWEB_EXT_SSL_PORT}#g; - s#__KEEP_EXT_SSL_PORT__#${KEEP_EXT_SSL_PORT}#g; - s#__MANAGEMENT_TOKEN__#${MANAGEMENT_TOKEN}#g; - s#__RELEASE__#${RELEASE}#g; - s#__SYSTEM_ROOT_TOKEN__#${SYSTEM_ROOT_TOKEN}#g; - s#__VERSION__#${VERSION}#g; - s#__CLUSTER_INT_CIDR__#${CLUSTER_INT_CIDR}#g; - s#__CONTROLLER_INT_IP__#${CONTROLLER_INT_IP}#g; - s#__WEBSOCKET_INT_IP__#${WEBSOCKET_INT_IP}#g; - s#__KEEP_INT_IP__#${KEEP_INT_IP}#g; - s#__KEEPSTORE0_INT_IP__#${KEEPSTORE0_INT_IP}#g; - s#__KEEPSTORE1_INT_IP__#${KEEPSTORE1_INT_IP}#g; - s#__KEEPWEB_INT_IP__#${KEEPWEB_INT_IP}#g; - s#__WEBSHELL_INT_IP__#${WEBSHELL_INT_IP}#g; - s#__WORKBENCH1_INT_IP__#${WORKBENCH1_INT_IP}#g; - s#__WORKBENCH2_INT_IP__#${WORKBENCH2_INT_IP}#g; - s#__DATABASE_INT_IP__#${DATABASE_INT_IP}#g; - s#__WEBSHELL_EXT_SSL_PORT__#${WEBSHELL_EXT_SSL_PORT}#g; - s#__SHELL_INT_IP__#${SHELL_INT_IP}#g; - s#__WEBSOCKET_EXT_SSL_PORT__#${WEBSOCKET_EXT_SSL_PORT}#g; - s#__WORKBENCH1_EXT_SSL_PORT__#${WORKBENCH1_EXT_SSL_PORT}#g; - s#__WORKBENCH2_EXT_SSL_PORT__#${WORKBENCH2_EXT_SSL_PORT}#g; - s#__WORKBENCH_SECRET_KEY__#${WORKBENCH_SECRET_KEY}#g" \ - "${f}" > "${F_DIR}/extra/extra"/$(basename "${f}") + s#__SYSTEM_ROOT_TOKEN__#${SYSTEM_ROOT_TOKEN}#g" + if [ "$USE_SINGLE_HOSTNAME" = "yes" ]; then + FILTERS="s#__CLUSTER__.__DOMAIN__#${HOSTNAME_EXT}#g; + $FILTERS" + fi + sed "$FILTERS" \ + "${f}" > ${T_DIR}/$(basename "${f}") + done + chmod 755 ${T_DIR}/run-test.sh +fi + +# Replace helper state files that differ from the formula's examples +if [ -d "${SOURCE_STATES_DIR}" ]; then + mkdir -p "${F_DIR}"/extra/extra + rm -rf "${F_DIR}"/extra/extra/* + + for f in $(ls "${SOURCE_STATES_DIR}"/*); do + apply_var_substitutions "${f}" "${F_DIR}/extra/extra"/$(basename "${f}") done fi @@ -489,15 +531,21 @@ fi # As we need to separate both states and pillars in case we want specific # roles, we iterate on both at the same time +# Formula template overrides (TOFS) +# See: https://template-formula.readthedocs.io/en/latest/TOFS_pattern.html#template-override +if [ -d ${SOURCE_TOFS_DIR} ]; then + find ${SOURCE_TOFS_DIR} -mindepth 1 -maxdepth 1 -type d -exec cp -r "{}" ${S_DIR} \; +fi + # States -cat > ${S_DIR}/top.sls << EOFTSLS +cat > ${STATES_TOP} << EOFTSLS base: '*': - locale EOFTSLS # Pillars -cat > ${P_DIR}/top.sls << EOFPSLS +cat > ${PILLARS_TOP} << EOFPSLS base: '*': - locale @@ -514,8 +562,8 @@ if [ -d "${F_DIR}"/extra/extra ]; then # Same when using self-signed certificates. SKIP_SNAKE_OIL="dont_add_snakeoil_certs" fi - for f in $(ls "${F_DIR}"/extra/extra/*.sls | grep -v ${SKIP_SNAKE_OIL}); do - echo " - extra.$(basename ${f} | sed 's/.sls$//g')" >> ${S_DIR}/top.sls + for f in $(ls "${F_DIR}"/extra/extra/*.sls | egrep -v "${SKIP_SNAKE_OIL}|shell_"); do + echo " - extra.$(basename ${f} | sed 's/.sls$//g')" >> ${STATES_TOP} done # Use byo or self-signed certificates if [ "${SSL_MODE}" != "lets-encrypt" ]; then @@ -525,41 +573,51 @@ fi # If we want specific roles for a node, just add the desired states # and its dependencies -if [ -z "${ROLES}" ]; then +if [ -z "${ROLES:-}" ]; then # States - echo " - nginx.passenger" >> ${S_DIR}/top.sls + echo " - nginx.passenger" >> ${STATES_TOP} if [ "${SSL_MODE}" = "lets-encrypt" ]; then if [ "${USE_LETSENCRYPT_ROUTE53}" = "yes" ]; then - grep -q "aws_credentials" ${S_DIR}/top.sls || echo " - extra.aws_credentials" >> ${S_DIR}/top.sls + grep -q "aws_credentials" ${STATES_TOP} || echo " - extra.aws_credentials" >> ${STATES_TOP} fi - grep -q "letsencrypt" ${S_DIR}/top.sls || echo " - letsencrypt" >> ${S_DIR}/top.sls + grep -q "letsencrypt" ${STATES_TOP} || echo " - letsencrypt" >> ${STATES_TOP} else - # Use custom certs, as both bring-your-own and self-signed are copied using this state - # Copy certs to formula extra/files - # In dev mode, the files will be created and put in the destination directory by the - # snakeoil_certs.sls state file - mkdir -p /srv/salt/certs - cp -rv ${CUSTOM_CERTS_DIR}/* /srv/salt/certs/ - # We add the custom_certs state - grep -q "custom_certs" ${S_DIR}/top.sls || echo " - extra.custom_certs" >> ${S_DIR}/top.sls + mkdir -p --mode=0700 /srv/salt/certs + if [ "${SSL_MODE}" = "bring-your-own" ]; then + # Copy certs to formula extra/files + install --mode=0600 ${CUSTOM_CERTS_DIR}/* /srv/salt/certs/ + # We add the custom_certs state + grep -q "custom_certs" ${STATES_TOP} || echo " - extra.custom_certs" >> ${STATES_TOP} + if [ "${SSL_KEY_ENCRYPTED}" = "yes" ]; then + grep -q "ssl_key_encrypted" ${STATES_TOP} || echo " - extra.ssl_key_encrypted" >> ${STATES_TOP} + fi + fi + # In self-signed mode, the certificate files will be created and put in the + # destination directory by the snakeoil_certs.sls state file fi - echo " - postgres" >> ${S_DIR}/top.sls - echo " - docker.software" >> ${S_DIR}/top.sls - echo " - arvados" >> ${S_DIR}/top.sls + echo " - postgres" >> ${STATES_TOP} + echo " - logrotate" >> ${STATES_TOP} + echo " - docker.software" >> ${STATES_TOP} + echo " - arvados" >> ${STATES_TOP} + echo " - extra.shell_sudo_passwordless" >> ${STATES_TOP} + echo " - extra.shell_cron_add_login_sync" >> ${STATES_TOP} + echo " - extra.passenger_rvm" >> ${STATES_TOP} # Pillars - echo " - docker" >> ${P_DIR}/top.sls - echo " - nginx_api_configuration" >> ${P_DIR}/top.sls - echo " - nginx_controller_configuration" >> ${P_DIR}/top.sls - echo " - nginx_keepproxy_configuration" >> ${P_DIR}/top.sls - echo " - nginx_keepweb_configuration" >> ${P_DIR}/top.sls - echo " - nginx_passenger" >> ${P_DIR}/top.sls - echo " - nginx_websocket_configuration" >> ${P_DIR}/top.sls - echo " - nginx_webshell_configuration" >> ${P_DIR}/top.sls - echo " - nginx_workbench2_configuration" >> ${P_DIR}/top.sls - echo " - nginx_workbench_configuration" >> ${P_DIR}/top.sls - echo " - postgresql" >> ${P_DIR}/top.sls + echo " - docker" >> ${PILLARS_TOP} + echo " - nginx_api_configuration" >> ${PILLARS_TOP} + echo " - logrotate_api" >> ${PILLARS_TOP} + echo " - nginx_controller_configuration" >> ${PILLARS_TOP} + echo " - nginx_keepproxy_configuration" >> ${PILLARS_TOP} + echo " - nginx_keepweb_configuration" >> ${PILLARS_TOP} + echo " - nginx_passenger" >> ${PILLARS_TOP} + echo " - nginx_websocket_configuration" >> ${PILLARS_TOP} + echo " - nginx_webshell_configuration" >> ${PILLARS_TOP} + echo " - nginx_workbench2_configuration" >> ${PILLARS_TOP} + echo " - nginx_workbench_configuration" >> ${PILLARS_TOP} + echo " - logrotate_wb1" >> ${PILLARS_TOP} + echo " - postgresql" >> ${PILLARS_TOP} # We need to tweak the Nginx's pillar depending whether we want plan nginx or nginx+passenger NGINX_INSTALL_SOURCE="install_from_phusionpassenger" @@ -567,20 +625,36 @@ if [ -z "${ROLES}" ]; then if [ "${SSL_MODE}" = "lets-encrypt" ]; then if [ "${USE_LETSENCRYPT_ROUTE53}" = "yes" ]; then - grep -q "aws_credentials" ${P_DIR}/top.sls || echo " - aws_credentials" >> ${P_DIR}/top.sls + grep -q "aws_credentials" ${PILLARS_TOP} || echo " - aws_credentials" >> ${PILLARS_TOP} + fi + grep -q "letsencrypt" ${PILLARS_TOP} || echo " - letsencrypt" >> ${PILLARS_TOP} + + hosts=("controller" "websocket" "workbench" "workbench2" "webshell" "keepproxy") + if [ ${USE_SINGLE_HOSTNAME} = "no" ]; then + hosts+=("download" "collections") + else + hosts+=("keepweb") fi - grep -q "letsencrypt" ${P_DIR}/top.sls || echo " - letsencrypt" >> ${P_DIR}/top.sls - # As the pillar differ whether we use LE or custom certs, we need to do a final edition on them - for c in controller websocket workbench workbench2 webshell download collections keepproxy; do - sed -i "s/__CERT_REQUIRES__/cmd: create-initial-cert-${c}.${CLUSTER}.${DOMAIN}*/g; - s#__CERT_PEM__#/etc/letsencrypt/live/${c}.${CLUSTER}.${DOMAIN}/fullchain.pem#g; - s#__CERT_KEY__#/etc/letsencrypt/live/${c}.${CLUSTER}.${DOMAIN}/privkey.pem#g" \ + for c in "${hosts[@]}"; do + # Are we in a single-host-single-hostname env? + if [ "${USE_SINGLE_HOSTNAME}" = "yes" ]; then + # Are we in a single-host-single-hostname env? + CERT_NAME=${HOSTNAME_EXT} + else + # We are in a multiple-hostnames env + CERT_NAME=${c}.${DOMAIN} + fi + + # As the pillar differs whether we use LE or custom certs, we need to do a final edition on them + sed -i "s/__CERT_REQUIRES__/cmd: create-initial-cert-${CERT_NAME}*/g; + s#__CERT_PEM__#/etc/letsencrypt/live/${CERT_NAME}/fullchain.pem#g; + s#__CERT_KEY__#/etc/letsencrypt/live/${CERT_NAME}/privkey.pem#g" \ ${P_DIR}/nginx_${c}_configuration.sls done else # Use custom certs (either dev mode or prod) - grep -q "extra_custom_certs" ${P_DIR}/top.sls || echo " - extra_custom_certs" >> ${P_DIR}/top.sls + grep -q "extra_custom_certs" ${PILLARS_TOP} || echo " - extra_custom_certs" >> ${PILLARS_TOP} # And add the certs in the custom_certs pillar echo "extra_custom_certs_dir: /srv/salt/certs" > ${P_DIR}/extra_custom_certs.sls echo "extra_custom_certs:" >> ${P_DIR}/extra_custom_certs.sls @@ -602,7 +676,7 @@ if [ -z "${ROLES}" ]; then grep -q ${CERT_NAME} ${P_DIR}/extra_custom_certs.sls || echo " - ${CERT_NAME}" >> ${P_DIR}/extra_custom_certs.sls # As the pillar differs whether we use LE or custom certs, we need to do a final edition on them - sed -i "s/__CERT_REQUIRES__/file: extra_custom_certs_file_copy_arvados-${CERT_NAME}.pem/g; + sed -i "s/__CERT_REQUIRES__/file: extra_custom_certs_${CERT_NAME}_cert_file_copy/g; s#__CERT_PEM__#/etc/nginx/ssl/arvados-${CERT_NAME}.pem#g; s#__CERT_KEY__#/etc/nginx/ssl/arvados-${CERT_NAME}.key#g" \ ${P_DIR}/nginx_${c}_configuration.sls @@ -610,77 +684,212 @@ if [ -z "${ROLES}" ]; then fi else # If we add individual roles, make sure we add the repo first - echo " - arvados.repo" >> ${S_DIR}/top.sls + echo " - arvados.repo" >> ${STATES_TOP} # We add the extra_custom_certs state - grep -q "extra.custom_certs" ${S_DIR}/top.sls || echo " - extra.custom_certs" >> ${S_DIR}/top.sls + grep -q "extra.custom_certs" ${STATES_TOP} || echo " - extra.custom_certs" >> ${STATES_TOP} + if [ "${SSL_KEY_ENCRYPTED}" = "yes" ]; then + grep -q "ssl_key_encrypted" ${STATES_TOP} || echo " - extra.ssl_key_encrypted" >> ${STATES_TOP} + fi # And we add the basic part for the certs pillar if [ "${SSL_MODE}" != "lets-encrypt" ]; then # And add the certs in the custom_certs pillar echo "extra_custom_certs_dir: /srv/salt/certs" > ${P_DIR}/extra_custom_certs.sls echo "extra_custom_certs:" >> ${P_DIR}/extra_custom_certs.sls - grep -q "extra_custom_certs" ${P_DIR}/top.sls || echo " - extra_custom_certs" >> ${P_DIR}/top.sls + grep -q "extra_custom_certs" ${PILLARS_TOP} || echo " - extra_custom_certs" >> ${PILLARS_TOP} fi - for R in ${ROLES}; do + # Prometheus state on all nodes due to the node exporter below + grep -q "\- prometheus$" ${STATES_TOP} || echo " - prometheus" >> ${STATES_TOP} + # Prometheus node exporter pillar + grep -q "prometheus_node_exporter" ${PILLARS_TOP} || echo " - prometheus_node_exporter" >> ${PILLARS_TOP} + + for R in ${ROLES:-}; do case "${R}" in "database") # States - echo " - postgres" >> ${S_DIR}/top.sls + grep -q "\- postgres$" ${STATES_TOP} || echo " - postgres" >> ${STATES_TOP} + grep -q "extra.prometheus_pg_exporter" ${STATES_TOP} || echo " - extra.prometheus_pg_exporter" >> ${STATES_TOP} # Pillars - echo ' - postgresql' >> ${P_DIR}/top.sls + grep -q "postgresql" ${PILLARS_TOP} || echo " - postgresql" >> ${PILLARS_TOP} + grep -q "prometheus_pg_exporter" ${PILLARS_TOP} || echo " - prometheus_pg_exporter" >> ${PILLARS_TOP} ;; - "api") - # States - # FIXME: https://dev.arvados.org/issues/17352 - grep -q "postgres.client" ${S_DIR}/top.sls || echo " - postgres.client" >> ${S_DIR}/top.sls - if grep -q " - nginx.*$" ${S_DIR}/top.sls; then - sed -i s/"^ - nginx.*$"/" - nginx.passenger"/g ${S_DIR}/top.sls - else - echo " - nginx.passenger" >> ${S_DIR}/top.sls + "monitoring") + ### Support files ### + GRAFANA_DASHBOARDS_DEST_DIR=/srv/salt/dashboards + mkdir -p "${GRAFANA_DASHBOARDS_DEST_DIR}" + rm -f "${GRAFANA_DASHBOARDS_DEST_DIR}"/* + # "ArvadosPromDataSource" is the hardcoded UID for Prometheus' datasource + # in Grafana. + for f in $(ls "${GRAFANA_DASHBOARDS_DIR}"/*.json); do + sed 's#${DS_PROMETHEUS}#ArvadosPromDataSource#g' \ + "${f}" > "${GRAFANA_DASHBOARDS_DEST_DIR}"/$(basename "${f}") + done + + ### States ### + grep -q "\- nginx$" ${STATES_TOP} || echo " - nginx" >> ${STATES_TOP} + grep -q "extra.nginx_prometheus_configuration" ${STATES_TOP} || echo " - extra.nginx_prometheus_configuration" >> ${STATES_TOP} + + grep -q "\- grafana$" ${STATES_TOP} || echo " - grafana" >> ${STATES_TOP} + grep -q "extra.grafana_datasource" ${STATES_TOP} || echo " - extra.grafana_datasource" >> ${STATES_TOP} + grep -q "extra.grafana_dashboards" ${STATES_TOP} || echo " - extra.grafana_dashboards" >> ${STATES_TOP} + grep -q "extra.grafana_admin_user" ${STATES_TOP} || echo " - extra.grafana_admin_user" >> ${STATES_TOP} + + if [ "${SSL_MODE}" = "lets-encrypt" ]; then + grep -q "letsencrypt" ${STATES_TOP} || echo " - letsencrypt" >> ${STATES_TOP} + if [ "x${USE_LETSENCRYPT_ROUTE53:-}" = "xyes" ]; then + grep -q "aws_credentials" ${STATES_TOP} || echo " - aws_credentials" >> ${STATES_TOP} + fi + elif [ "${SSL_MODE}" = "bring-your-own" ]; then + for SVC in grafana prometheus; do + copy_custom_cert ${CUSTOM_CERTS_DIR} ${SVC} + done fi - ### If we don't install and run LE before arvados-api-server, it fails and breaks everything - ### after it. So we add this here as we are, after all, sharing the host for api and controller + ### Pillars ### + grep -q "prometheus_server" ${PILLARS_TOP} || echo " - prometheus_server" >> ${PILLARS_TOP} + grep -q "grafana" ${PILLARS_TOP} || echo " - grafana" >> ${PILLARS_TOP} + for SVC in grafana prometheus; do + grep -q "nginx_${SVC}_configuration" ${PILLARS_TOP} || echo " - nginx_${SVC}_configuration" >> ${PILLARS_TOP} + done if [ "${SSL_MODE}" = "lets-encrypt" ]; then + grep -q "letsencrypt" ${PILLARS_TOP} || echo " - letsencrypt" >> ${PILLARS_TOP} + for SVC in grafana prometheus; do + grep -q "letsencrypt_${SVC}_configuration" ${PILLARS_TOP} || echo " - letsencrypt_${SVC}_configuration" >> ${PILLARS_TOP} + sed -i "s/__CERT_REQUIRES__/cmd: create-initial-cert-${SVC}.${DOMAIN}*/g; + s#__CERT_PEM__#/etc/letsencrypt/live/${SVC}.${DOMAIN}/fullchain.pem#g; + s#__CERT_KEY__#/etc/letsencrypt/live/${SVC}.${DOMAIN}/privkey.pem#g" \ + ${P_DIR}/nginx_${SVC}_configuration.sls + done if [ "${USE_LETSENCRYPT_ROUTE53}" = "yes" ]; then - grep -q "aws_credentials" ${S_DIR}/top.sls || echo " - aws_credentials" >> ${S_DIR}/top.sls + grep -q "aws_credentials" ${PILLARS_TOP} || echo " - aws_credentials" >> ${PILLARS_TOP} fi - grep -q "letsencrypt" ${S_DIR}/top.sls || echo " - letsencrypt" >> ${S_DIR}/top.sls + elif [ "${SSL_MODE}" = "bring-your-own" ]; then + grep -q "ssl_key_encrypted" ${PILLARS_TOP} || echo " - ssl_key_encrypted" >> ${PILLARS_TOP} + for SVC in grafana prometheus; do + sed -i "s/__CERT_REQUIRES__/file: extra_custom_certs_${SVC}_cert_file_copy/g; + s#__CERT_PEM__#/etc/nginx/ssl/arvados-${SVC}.pem#g; + s#__CERT_KEY__#/etc/nginx/ssl/arvados-${SVC}.key#g" \ + ${P_DIR}/nginx_${SVC}_configuration.sls + grep -q ${SVC} ${P_DIR}/extra_custom_certs.sls || echo " - ${SVC}" >> ${P_DIR}/extra_custom_certs.sls + done + fi + ;; + "balancer") + ### States ### + grep -q "\- nginx$" ${STATES_TOP} || echo " - nginx" >> ${STATES_TOP} + + if [ "${SSL_MODE}" = "lets-encrypt" ]; then + grep -q "letsencrypt" ${STATES_TOP} || echo " - letsencrypt" >> ${STATES_TOP} + if [ "x${USE_LETSENCRYPT_ROUTE53:-}" = "xyes" ]; then + grep -q "aws_credentials" ${STATES_TOP} || echo " - aws_credentials" >> ${STATES_TOP} + fi + elif [ "${SSL_MODE}" = "bring-your-own" ]; then + copy_custom_cert ${CUSTOM_CERTS_DIR} ${R} + fi + + ### Pillars ### + grep -q "nginx_${R}_configuration" ${PILLARS_TOP} || echo " - nginx_${R}_configuration" >> ${PILLARS_TOP} + + if [ "${SSL_MODE}" = "lets-encrypt" ]; then + grep -q "letsencrypt" ${PILLARS_TOP} || echo " - letsencrypt" >> ${PILLARS_TOP} + + grep -q "letsencrypt_${R}_configuration" ${PILLARS_TOP} || echo " - letsencrypt_${R}_configuration" >> ${PILLARS_TOP} + sed -i "s/__CERT_REQUIRES__/cmd: create-initial-cert-${ROLE2NODES['balancer']}*/g; + s#__CERT_PEM__#/etc/letsencrypt/live/${ROLE2NODES['balancer']}/fullchain.pem#g; + s#__CERT_KEY__#/etc/letsencrypt/live/${ROLE2NODES['balancer']}/privkey.pem#g" \ + ${P_DIR}/nginx_${R}_configuration.sls + + if [ "${USE_LETSENCRYPT_ROUTE53}" = "yes" ]; then + grep -q "aws_credentials" ${PILLARS_TOP} || echo " - aws_credentials" >> ${PILLARS_TOP} + fi + elif [ "${SSL_MODE}" = "bring-your-own" ]; then + grep -q "ssl_key_encrypted" ${PILLARS_TOP} || echo " - ssl_key_encrypted" >> ${PILLARS_TOP} + sed -i "s/__CERT_REQUIRES__/file: extra_custom_certs_${R}_cert_file_copy/g; + s#__CERT_PEM__#/etc/nginx/ssl/arvados-${R}.pem#g; + s#__CERT_KEY__#/etc/nginx/ssl/arvados-${R}.key#g" \ + ${P_DIR}/nginx_${R}_configuration.sls + grep -q "${R}" ${P_DIR}/extra_custom_certs.sls || echo " - ${R}" >> ${P_DIR}/extra_custom_certs.sls + fi + ;; + "controller") + ### States ### + grep -q " - logrotate" ${STATES_TOP} || echo " - logrotate" >> ${STATES_TOP} + if grep -q " - nginx.*$" ${STATES_TOP}; then + sed -i s/"^ - nginx.*$"/" - nginx.passenger"/g ${STATES_TOP} else - # Use custom certs - if [ "${SSL_MODE}" = "bring-your-own" ]; then - copy_custom_cert ${CUSTOM_CERTS_DIR} controller + echo " - nginx.passenger" >> ${STATES_TOP} + fi + echo " - extra.passenger_rvm" >> ${STATES_TOP} + grep -q "^ - postgres\\.client$" ${STATES_TOP} || echo " - postgres.client" >> ${STATES_TOP} + + ### If we don't install and run LE before arvados-api-server, it fails and breaks everything + ### after it. So we add this here as we are, after all, sharing the host for api and controller + if [ "${ENABLE_BALANCER}" == "no" ]; then + if [ "${SSL_MODE}" = "lets-encrypt" ]; then + if [ "x${USE_LETSENCRYPT_ROUTE53:-}" = "xyes" ]; then + grep -q "aws_credentials" ${STATES_TOP} || echo " - aws_credentials" >> ${STATES_TOP} + fi + grep -q "letsencrypt" ${STATES_TOP} || echo " - letsencrypt" >> ${STATES_TOP} + elif [ "${SSL_MODE}" = "bring-your-own" ]; then + copy_custom_cert ${CUSTOM_CERTS_DIR} ${R} + grep -q controller ${P_DIR}/extra_custom_certs.sls || echo " - controller" >> ${P_DIR}/extra_custom_certs.sls fi - grep -q controller ${P_DIR}/extra_custom_certs.sls || echo " - controller" >> ${P_DIR}/extra_custom_certs.sls fi - grep -q "arvados.${R}" ${S_DIR}/top.sls || echo " - arvados.${R}" >> ${S_DIR}/top.sls - # Pillars - grep -q "aws_credentials" ${P_DIR}/top.sls || echo " - aws_credentials" >> ${P_DIR}/top.sls - grep -q "postgresql" ${P_DIR}/top.sls || echo " - postgresql" >> ${P_DIR}/top.sls - grep -q "nginx_passenger" ${P_DIR}/top.sls || echo " - nginx_passenger" >> ${P_DIR}/top.sls - grep -q "nginx_${R}_configuration" ${P_DIR}/top.sls || echo " - nginx_${R}_configuration" >> ${P_DIR}/top.sls + grep -q "arvados.api" ${STATES_TOP} || echo " - arvados.api" >> ${STATES_TOP} + grep -q "arvados.controller" ${STATES_TOP} || echo " - arvados.controller" >> ${STATES_TOP} + + ### Pillars ### + grep -q "logrotate_api" ${PILLARS_TOP} || echo " - logrotate_api" >> ${PILLARS_TOP} + grep -q "aws_credentials" ${PILLARS_TOP} || echo " - aws_credentials" >> ${PILLARS_TOP} + grep -q "postgresql" ${PILLARS_TOP} || echo " - postgresql" >> ${PILLARS_TOP} + grep -q "nginx_passenger" ${PILLARS_TOP} || echo " - nginx_passenger" >> ${PILLARS_TOP} + grep -q "nginx_api_configuration" ${PILLARS_TOP} || echo " - nginx_api_configuration" >> ${PILLARS_TOP} + grep -q "nginx_controller_configuration" ${PILLARS_TOP} || echo " - nginx_controller_configuration" >> ${PILLARS_TOP} + + if [ "${ENABLE_BALANCER}" == "no" ]; then + if [ "${SSL_MODE}" = "lets-encrypt" ]; then + if [ "${USE_LETSENCRYPT_ROUTE53}" = "yes" ]; then + grep -q "aws_credentials" ${PILLARS_TOP} || echo " - aws_credentials" >> ${PILLARS_TOP} + fi + grep -q "letsencrypt" ${PILLARS_TOP} || echo " - letsencrypt" >> ${PILLARS_TOP} + grep -q "letsencrypt_${R}_configuration" ${PILLARS_TOP} || echo " - letsencrypt_${R}_configuration" >> ${PILLARS_TOP} + sed -i "s/__CERT_REQUIRES__/cmd: create-initial-cert-${R}.${DOMAIN}*/g; + s#__CERT_PEM__#/etc/letsencrypt/live/${R}.${DOMAIN}/fullchain.pem#g; + s#__CERT_KEY__#/etc/letsencrypt/live/${R}.${DOMAIN}/privkey.pem#g" \ + ${P_DIR}/nginx_${R}_configuration.sls + else + grep -q "ssl_key_encrypted" ${PILLARS_TOP} || echo " - ssl_key_encrypted" >> ${PILLARS_TOP} + sed -i "s/__CERT_REQUIRES__/file: extra_custom_certs_${R}_cert_file_copy/g; + s#__CERT_PEM__#/etc/nginx/ssl/arvados-${R}.pem#g; + s#__CERT_KEY__#/etc/nginx/ssl/arvados-${R}.key#g" \ + ${P_DIR}/nginx_${R}_configuration.sls + grep -q ${R} ${P_DIR}/extra_custom_certs.sls || echo " - ${R}" >> ${P_DIR}/extra_custom_certs.sls + fi + fi # We need to tweak the Nginx's pillar depending whether we want plain nginx or nginx+passenger NGINX_INSTALL_SOURCE="install_from_phusionpassenger" sed -i "s/__NGINX_INSTALL_SOURCE__/${NGINX_INSTALL_SOURCE}/g" ${P_DIR}/nginx_passenger.sls ;; - "controller" | "websocket" | "workbench" | "workbench2" | "webshell" | "keepweb" | "keepproxy") - # States + "websocket" | "workbench" | "workbench2" | "webshell" | "keepweb" | "keepproxy") + ### States ### if [ "${R}" = "workbench" ]; then + grep -q " - logrotate" ${STATES_TOP} || echo " - logrotate" >> ${STATES_TOP} NGINX_INSTALL_SOURCE="install_from_phusionpassenger" - if grep -q " - nginx$" ${S_DIR}/top.sls; then - sed -i s/"^ - nginx.*$"/" - nginx.passenger"/g ${S_DIR}/top.sls + if grep -q " - nginx$" ${STATES_TOP}; then + sed -i s/"^ - nginx.*$"/" - nginx.passenger"/g ${STATES_TOP} else - echo " - nginx.passenger" >> ${S_DIR}/top.sls + echo " - nginx.passenger" >> ${STATES_TOP} fi else - grep -q "nginx" ${S_DIR}/top.sls || echo " - nginx" >> ${S_DIR}/top.sls + grep -q "\- nginx$" ${STATES_TOP} || echo " - nginx" >> ${STATES_TOP} fi + if [ "${SSL_MODE}" = "lets-encrypt" ]; then - if [ "x${USE_LETSENCRYPT_ROUTE53}" = "xyes" ]; then - grep -q "aws_credentials" ${S_DIR}/top.sls || echo " - aws_credentials" >> ${S_DIR}/top.sls + if [ "x${USE_LETSENCRYPT_ROUTE53:-}" = "xyes" ]; then + grep -q "aws_credentials" ${STATES_TOP} || echo " - aws_credentials" >> ${STATES_TOP} fi - grep -q "letsencrypt" ${S_DIR}/top.sls || echo " - letsencrypt" >> ${S_DIR}/top.sls + grep -q "letsencrypt" ${STATES_TOP} || echo " - letsencrypt" >> ${STATES_TOP} else # Use custom certs, special case for keepweb if [ ${R} = "keepweb" ]; then @@ -694,54 +903,60 @@ else fi fi fi + # webshell role is just a nginx vhost, so it has no state if [ "${R}" != "webshell" ]; then - grep -q "arvados.${R}" ${S_DIR}/top.sls || echo " - arvados.${R}" >> ${S_DIR}/top.sls + grep -q "arvados.${R}" ${STATES_TOP} || echo " - arvados.${R}" >> ${STATES_TOP} fi - # Pillars - grep -q "nginx_passenger" ${P_DIR}/top.sls || echo " - nginx_passenger" >> ${P_DIR}/top.sls - grep -q "nginx_${R}_configuration" ${P_DIR}/top.sls || echo " - nginx_${R}_configuration" >> ${P_DIR}/top.sls + + ### Pillars ### + if [ "${R}" = "workbench" ]; then + grep -q "logrotate_wb1" ${PILLARS_TOP} || echo " - logrotate_wb1" >> ${PILLARS_TOP} + fi + grep -q "nginx_passenger" ${PILLARS_TOP} || echo " - nginx_passenger" >> ${PILLARS_TOP} + grep -q "nginx_${R}_configuration" ${PILLARS_TOP} || echo " - nginx_${R}_configuration" >> ${PILLARS_TOP} # Special case for keepweb if [ ${R} = "keepweb" ]; then - grep -q "nginx_download_configuration" ${P_DIR}/top.sls || echo " - nginx_download_configuration" >> ${P_DIR}/top.sls - grep -q "nginx_collections_configuration" ${P_DIR}/top.sls || echo " - nginx_collections_configuration" >> ${P_DIR}/top.sls + grep -q "nginx_download_configuration" ${PILLARS_TOP} || echo " - nginx_download_configuration" >> ${PILLARS_TOP} + grep -q "nginx_collections_configuration" ${PILLARS_TOP} || echo " - nginx_collections_configuration" >> ${PILLARS_TOP} fi if [ "${SSL_MODE}" = "lets-encrypt" ]; then if [ "${USE_LETSENCRYPT_ROUTE53}" = "yes" ]; then - grep -q "aws_credentials" ${P_DIR}/top.sls || echo " - aws_credentials" >> ${P_DIR}/top.sls + grep -q "aws_credentials" ${PILLARS_TOP} || echo " - aws_credentials" >> ${PILLARS_TOP} fi - grep -q "letsencrypt" ${P_DIR}/top.sls || echo " - letsencrypt" >> ${P_DIR}/top.sls - grep -q "letsencrypt_${R}_configuration" ${P_DIR}/top.sls || echo " - letsencrypt_${R}_configuration" >> ${P_DIR}/top.sls + grep -q "letsencrypt" ${PILLARS_TOP} || echo " - letsencrypt" >> ${PILLARS_TOP} + grep -q "letsencrypt_${R}_configuration" ${PILLARS_TOP} || echo " - letsencrypt_${R}_configuration" >> ${PILLARS_TOP} # As the pillar differ whether we use LE or custom certs, we need to do a final edition on them # Special case for keepweb if [ ${R} = "keepweb" ]; then for kwsub in download collections; do - sed -i "s/__CERT_REQUIRES__/cmd: create-initial-cert-${kwsub}.${CLUSTER}.${DOMAIN}*/g; - s#__CERT_PEM__#/etc/letsencrypt/live/${kwsub}.${CLUSTER}.${DOMAIN}/fullchain.pem#g; - s#__CERT_KEY__#/etc/letsencrypt/live/${kwsub}.${CLUSTER}.${DOMAIN}/privkey.pem#g" \ + sed -i "s/__CERT_REQUIRES__/cmd: create-initial-cert-${kwsub}.${DOMAIN}*/g; + s#__CERT_PEM__#/etc/letsencrypt/live/${kwsub}.${DOMAIN}/fullchain.pem#g; + s#__CERT_KEY__#/etc/letsencrypt/live/${kwsub}.${DOMAIN}/privkey.pem#g" \ ${P_DIR}/nginx_${kwsub}_configuration.sls done else - sed -i "s/__CERT_REQUIRES__/cmd: create-initial-cert-${R}.${CLUSTER}.${DOMAIN}*/g; - s#__CERT_PEM__#/etc/letsencrypt/live/${R}.${CLUSTER}.${DOMAIN}/fullchain.pem#g; - s#__CERT_KEY__#/etc/letsencrypt/live/${R}.${CLUSTER}.${DOMAIN}/privkey.pem#g" \ + sed -i "s/__CERT_REQUIRES__/cmd: create-initial-cert-${R}.${DOMAIN}*/g; + s#__CERT_PEM__#/etc/letsencrypt/live/${R}.${DOMAIN}/fullchain.pem#g; + s#__CERT_KEY__#/etc/letsencrypt/live/${R}.${DOMAIN}/privkey.pem#g" \ ${P_DIR}/nginx_${R}_configuration.sls fi else + grep -q "ssl_key_encrypted" ${PILLARS_TOP} || echo " - ssl_key_encrypted" >> ${PILLARS_TOP} # As the pillar differ whether we use LE or custom certs, we need to do a final edition on them # Special case for keepweb if [ ${R} = "keepweb" ]; then for kwsub in download collections; do - sed -i "s/__CERT_REQUIRES__/file: extra_custom_certs_file_copy_arvados-${kwsub}.pem/g; + sed -i "s/__CERT_REQUIRES__/file: extra_custom_certs_${kwsub}_cert_file_copy/g; s#__CERT_PEM__#/etc/nginx/ssl/arvados-${kwsub}.pem#g; s#__CERT_KEY__#/etc/nginx/ssl/arvados-${kwsub}.key#g" \ ${P_DIR}/nginx_${kwsub}_configuration.sls grep -q ${kwsub} ${P_DIR}/extra_custom_certs.sls || echo " - ${kwsub}" >> ${P_DIR}/extra_custom_certs.sls done else - sed -i "s/__CERT_REQUIRES__/file: extra_custom_certs_file_copy_arvados-${R}.pem/g; + sed -i "s/__CERT_REQUIRES__/file: extra_custom_certs_${R}_cert_file_copy/g; s#__CERT_PEM__#/etc/nginx/ssl/arvados-${R}.pem#g; s#__CERT_KEY__#/etc/nginx/ssl/arvados-${R}.key#g" \ ${P_DIR}/nginx_${R}_configuration.sls @@ -753,14 +968,16 @@ else ;; "shell") # States - grep -q "docker" ${S_DIR}/top.sls || echo " - docker.software" >> ${S_DIR}/top.sls - grep -q "arvados.${R}" ${S_DIR}/top.sls || echo " - arvados.${R}" >> ${S_DIR}/top.sls + echo " - extra.shell_sudo_passwordless" >> ${STATES_TOP} + echo " - extra.shell_cron_add_login_sync" >> ${STATES_TOP} + grep -q "docker" ${STATES_TOP} || echo " - docker.software" >> ${STATES_TOP} + grep -q "arvados.${R}" ${STATES_TOP} || echo " - arvados.${R}" >> ${STATES_TOP} # Pillars - grep -q "docker" ${P_DIR}/top.sls || echo " - docker" >> ${P_DIR}/top.sls + grep -q "docker" ${PILLARS_TOP} || echo " - docker" >> ${PILLARS_TOP} ;; "dispatcher" | "keepbalance" | "keepstore") # States - grep -q "arvados.${R}" ${S_DIR}/top.sls || echo " - arvados.${R}" >> ${S_DIR}/top.sls + grep -q "arvados.${R}" ${STATES_TOP} || echo " - arvados.${R}" >> ${STATES_TOP} # Pillars # ATM, no specific pillar needed ;; @@ -777,21 +994,8 @@ if [ "${DUMP_CONFIG}" = "yes" ]; then exit 0 fi -# FIXME! #16992 Temporary fix for psql call in arvados-api-server -if [ -e /root/.psqlrc ]; then - if ! ( grep 'pset pager off' /root/.psqlrc ); then - RESTORE_PSQL="yes" - cp /root/.psqlrc /root/.psqlrc.provision.backup - fi -else - DELETE_PSQL="yes" -fi - -echo '\pset pager off' >> /root/.psqlrc -# END FIXME! #16992 Temporary fix for psql call in arvados-api-server - # Now run the install -salt-call --local state.apply -l ${LOG_LEVEL} +salt-call --state-output=mixed --local state.apply -l ${LOG_LEVEL} # Finally, make sure that /etc/hosts is not overwritten on reboot if [ -d /etc/cloud/cloud.cfg.d ]; then @@ -799,34 +1003,24 @@ if [ -d /etc/cloud/cloud.cfg.d ]; then sed -i 's/^manage_etc_hosts: true/#manage_etc_hosts: true/g' /etc/cloud/cloud.cfg.d/* fi -# FIXME! #16992 Temporary fix for psql call in arvados-api-server -if [ "x${DELETE_PSQL}" = "xyes" ]; then - echo "Removing .psql file" - rm /root/.psqlrc -fi - -if [ "x${RESTORE_PSQL}" = "xyes" ]; then - echo "Restoring .psql file" - mv -v /root/.psqlrc.provision.backup /root/.psqlrc -fi -# END FIXME! #16992 Temporary fix for psql call in arvados-api-server - # Leave a copy of the Arvados CA so the user can copy it where it's required -if [ "$DEV_MODE" = "yes" ]; then - echo "Copying the Arvados CA certificate to the installer dir, so you can import it" - # If running in a vagrant VM, also add default user to docker group - if [ "x${VAGRANT}" = "xyes" ]; then - cp /etc/ssl/certs/arvados-snakeoil-ca.pem /vagrant/${CLUSTER}.${DOMAIN}-arvados-snakeoil-ca.pem +if [ "${SSL_MODE}" = "self-signed" ]; then + echo "Copying the Arvados CA certificate '${DOMAIN}-arvados-snakeoil-ca.crt' to the installer dir, so you can import it" + if [ "x${VAGRANT:-}" = "xyes" ]; then + cp /etc/ssl/certs/arvados-snakeoil-ca.pem /vagrant/${DOMAIN}-arvados-snakeoil-ca.pem + else + cp /etc/ssl/certs/arvados-snakeoil-ca.pem ${SCRIPT_DIR}/${DOMAIN}-arvados-snakeoil-ca.crt + fi +fi +if [ "x${VAGRANT:-}" = "xyes" ]; then + # If running in a vagrant VM, also add default user to docker group echo "Adding the vagrant user to the docker group" usermod -a -G docker vagrant - else - cp /etc/ssl/certs/arvados-snakeoil-ca.pem ${SCRIPT_DIR}/${CLUSTER}.${DOMAIN}-arvados-snakeoil-ca.pem - fi fi # Test that the installation finished correctly -if [ "x${TEST}" = "xyes" ]; then +if [ "x${TEST:-}" = "xyes" ]; then cd ${T_DIR} # If we use RVM, we need to run this with it, or most ruby commands will fail RVM_EXEC=""