X-Git-Url: https://git.arvados.org/arvados.git/blobdiff_plain/2361a96130524ee57b0e1d652d560e8e31993b04..a4fc0df348d192c2b147d4964c0dfa4079e2181f:/lib/install/init.go diff --git a/lib/install/init.go b/lib/install/init.go index 2257fc57c4..14e2eaafab 100644 --- a/lib/install/init.go +++ b/lib/install/init.go @@ -13,16 +13,24 @@ import ( "flag" "fmt" "io" + "net" + "net/http" + "net/url" "os" "os/exec" "os/user" "regexp" "strconv" + "strings" + "sync/atomic" "text/template" + "time" "git.arvados.org/arvados.git/lib/cmd" "git.arvados.org/arvados.git/lib/config" + "git.arvados.org/arvados.git/lib/controller/rpc" "git.arvados.org/arvados.git/sdk/go/arvados" + "git.arvados.org/arvados.git/sdk/go/auth" "git.arvados.org/arvados.git/sdk/go/ctxlog" "github.com/lib/pq" ) @@ -35,7 +43,14 @@ type initCommand struct { PostgreSQLPassword string Login string TLS string + AdminEmail string Start bool + + LoginPAM bool + LoginTest bool + LoginGoogle bool + LoginGoogleClientID string + LoginGoogleClientSecret string } func (initcmd *initCommand) RunCommand(prog string, args []string, stdin io.Reader, stdout, stderr io.Writer) int { @@ -62,7 +77,8 @@ func (initcmd *initCommand) RunCommand(prog string, args []string, stdin io.Read versionFlag := flags.Bool("version", false, "Write version information to stdout and exit 0") flags.StringVar(&initcmd.ClusterID, "cluster-id", "", "cluster `id`, like x1234 for a dev cluster") flags.StringVar(&initcmd.Domain, "domain", hostname, "cluster public DNS `name`, like x1234.arvadosapi.com") - flags.StringVar(&initcmd.Login, "login", "", "login `backend`: test, pam, or ''") + flags.StringVar(&initcmd.Login, "login", "", "login `backend`: test, pam, 'google {client-id} {client-secret}', or ''") + flags.StringVar(&initcmd.AdminEmail, "admin-email", "", "give admin privileges to user with given `email`") flags.StringVar(&initcmd.TLS, "tls", "none", "tls certificate `source`: acme, auto, insecure, or none") flags.BoolVar(&initcmd.Start, "start", true, "start systemd service after creating config") if ok, code := cmd.ParseFlags(flags, prog, args, "", stderr); !ok { @@ -74,6 +90,62 @@ func (initcmd *initCommand) RunCommand(prog string, args []string, stdin io.Read return 1 } + if fields := strings.Fields(initcmd.Login); len(fields) == 3 && fields[0] == "google" { + initcmd.LoginGoogle = true + initcmd.LoginGoogleClientID = fields[1] + initcmd.LoginGoogleClientSecret = fields[2] + } else if initcmd.Login == "test" { + initcmd.LoginTest = true + if initcmd.AdminEmail == "" { + initcmd.AdminEmail = "admin@example.com" + } + } else if initcmd.Login == "pam" { + initcmd.LoginPAM = true + } else if initcmd.Login == "" { + // none; login will show an error page + } else { + err = fmt.Errorf("invalid argument to -login: %q: should be 'test', 'pam', 'google {client-id} {client-secret}', or empty", initcmd.Login) + return 1 + } + + confdir := "/etc/arvados" + conffile := confdir + "/config.yml" + if _, err = os.Stat(conffile); err == nil { + err = fmt.Errorf("config file %s already exists; delete it first if you really want to start over", conffile) + return 1 + } + + ports := []int{443} + for i := 4440; i < 4460; i++ { + ports = append(ports, i) + } + if initcmd.TLS == "acme" { + ports = append(ports, 80) + } + for _, port := range ports { + err = initcmd.checkPort(ctx, fmt.Sprintf("%d", port)) + if err != nil { + return 1 + } + } + + // Do the "create extension" thing early. This way, if there's + // no local postgresql server (a likely failure mode), we can + // bail out without any side effects, and the user can start + // over easily. + fmt.Fprintln(stderr, "installing pg_trgm postgresql extension...") + cmd := exec.CommandContext(ctx, "sudo", "-u", "postgres", "psql", "--quiet", + "-c", `CREATE EXTENSION IF NOT EXISTS pg_trgm`) + cmd.Dir = "/" + cmd.Stdout = stdout + cmd.Stderr = stderr + err = cmd.Run() + if err != nil { + err = fmt.Errorf("error preparing postgresql server: %w", err) + return 1 + } + fmt.Fprintln(stderr, "...done") + wwwuser, err := user.Lookup("www-data") if err != nil { err = fmt.Errorf("user.Lookup(%q): %w", "www-data", err) @@ -85,22 +157,28 @@ func (initcmd *initCommand) RunCommand(prog string, args []string, stdin io.Read } initcmd.PostgreSQLPassword = initcmd.RandomHex(32) + fmt.Fprintln(stderr, "creating data storage directory /var/lib/arvados/keep ...") err = os.Mkdir("/var/lib/arvados/keep", 0600) if err != nil && !os.IsExist(err) { err = fmt.Errorf("mkdir /var/lib/arvados/keep: %w", err) return 1 } - fmt.Fprintln(stderr, "created /var/lib/arvados/keep") + fmt.Fprintln(stderr, "...done") - err = os.Mkdir("/etc/arvados", 0750) + fmt.Fprintln(stderr, "creating config file", conffile, "...") + err = os.Mkdir(confdir, 0750) if err != nil && !os.IsExist(err) { - err = fmt.Errorf("mkdir /etc/arvados: %w", err) + err = fmt.Errorf("mkdir %s: %w", confdir, err) + return 1 + } + err = os.Chown(confdir, 0, wwwgid) + if err != nil { + err = fmt.Errorf("chown 0:%d %s: %w", wwwgid, confdir, err) return 1 } - err = os.Chown("/etc/arvados", 0, wwwgid) - f, err := os.OpenFile("/etc/arvados/config.yml", os.O_CREATE|os.O_EXCL|os.O_WRONLY, 0644) + f, err := os.OpenFile(conffile+".tmp", os.O_CREATE|os.O_EXCL|os.O_WRONLY, 0644) if err != nil { - err = fmt.Errorf("open /etc/arvados/config.yml: %w", err) + err = fmt.Errorf("open %s: %w", conffile+".tmp", err) return 1 } tmpl, err := template.New("config").Parse(`Clusters: @@ -116,7 +194,7 @@ func (initcmd *initCommand) RunCommand(prog string, args []string, stdin io.Read Websocket: InternalURLs: "http://0.0.0.0:8005/": {} - ExternalURL: {{printf "%q" ( print "wss://" .Domain ":4436/" ) }} + ExternalURL: {{printf "%q" ( print "wss://" .Domain ":4446/" ) }} Keepbalance: InternalURLs: "http://0.0.0.0:9019/": {} @@ -168,7 +246,7 @@ func (initcmd *initCommand) RunCommand(prog string, args []string, stdin io.Read ManagementToken: {{printf "%q" ( .RandomHex 50 )}} PostgreSQL: Connection: - dbname: arvados_production + dbname: arvados host: localhost user: arvados password: {{printf "%q" .PostgreSQLPassword}} @@ -192,47 +270,54 @@ func (initcmd *initCommand) RunCommand(prog string, args []string, stdin io.Read Replication: 2 Workbench: SecretKeyBase: {{printf "%q" ( .RandomHex 50 )}} + {{if .LoginPAM}} Login: - {{if eq .Login "pam"}} PAM: Enable: true - {{else if eq .Login "test"}} + {{else if .LoginTest}} + Login: Test: Enable: true Users: admin: - Email: admin@example.com + Email: {{printf "%q" .AdminEmail}} Password: admin - {{else}} - {} - {{end}} + {{else if .LoginGoogle}} + Login: + Google: + Enable: true + ClientID: {{printf "%q" .LoginGoogleClientID}} + ClientSecret: {{printf "%q" .LoginGoogleClientSecret}} + {{end}} Users: - {{if eq .Login "test"}} - AutoAdminUserWithEmail: admin@example.com - {{else}} - {} - {{end}} + AutoAdminUserWithEmail: {{printf "%q" .AdminEmail}} `) if err != nil { return 1 } err = tmpl.Execute(f, initcmd) if err != nil { - err = fmt.Errorf("/etc/arvados/config.yml: tmpl.Execute: %w", err) + err = fmt.Errorf("%s: tmpl.Execute: %w", conffile+".tmp", err) return 1 } err = f.Close() if err != nil { - err = fmt.Errorf("/etc/arvados/config.yml: close: %w", err) + err = fmt.Errorf("%s: close: %w", conffile+".tmp", err) return 1 } - fmt.Fprintln(stderr, "created /etc/arvados/config.yml") + err = os.Rename(conffile+".tmp", conffile) + if err != nil { + err = fmt.Errorf("rename %s -> %s: %w", conffile+".tmp", conffile, err) + return 1 + } + fmt.Fprintln(stderr, "...done") ldr := config.NewLoader(nil, logger) ldr.SkipLegacy = true + ldr.Path = conffile // load the file we just wrote, even if $ARVADOS_CONFIG is set cfg, err := ldr.Load() if err != nil { - err = fmt.Errorf("/etc/arvados/config.yml: %w", err) + err = fmt.Errorf("%s: %w", conffile, err) return 1 } cluster, err := cfg.GetCluster("") @@ -240,25 +325,28 @@ func (initcmd *initCommand) RunCommand(prog string, args []string, stdin io.Read return 1 } + fmt.Fprintln(stderr, "creating postresql user and database...") err = initcmd.createDB(ctx, cluster.PostgreSQL.Connection, stderr) if err != nil { return 1 } + fmt.Fprintln(stderr, "...done") - cmd := exec.CommandContext(ctx, "sudo", "-u", "www-data", "-E", "HOME=/var/www", "PATH=/var/lib/arvados/bin:"+os.Getenv("PATH"), "/var/lib/arvados/bin/bundle", "exec", "rake", "db:setup") + fmt.Fprintln(stderr, "initializing database...") + cmd = exec.CommandContext(ctx, "sudo", "-u", "www-data", "-E", "HOME=/var/www", "PATH=/var/lib/arvados/bin:"+os.Getenv("PATH"), "/var/lib/arvados/bin/bundle", "exec", "rake", "db:setup") cmd.Dir = "/var/lib/arvados/railsapi" cmd.Stdout = stderr cmd.Stderr = stderr err = cmd.Run() if err != nil { - err = fmt.Errorf("rake db:setup: %w", err) + err = fmt.Errorf("rake db:setup failed: %w", err) return 1 } - fmt.Fprintln(stderr, "initialized database") + fmt.Fprintln(stderr, "...done") if initcmd.Start { - fmt.Fprintln(stderr, "starting systemd service") - cmd := exec.CommandContext(ctx, "systemctl", "start", "--no-block", "arvados") + fmt.Fprintln(stderr, "starting systemd service...") + cmd := exec.CommandContext(ctx, "systemctl", "start", "arvados") cmd.Dir = "/" cmd.Stdout = stderr cmd.Stderr = stderr @@ -267,8 +355,50 @@ func (initcmd *initCommand) RunCommand(prog string, args []string, stdin io.Read err = fmt.Errorf("%v: %w", cmd.Args, err) return 1 } + fmt.Fprintln(stderr, "...done") + + fmt.Fprintln(stderr, "checking controller API endpoint...") + u := url.URL(cluster.Services.Controller.ExternalURL) + conn := rpc.NewConn(cluster.ClusterID, &u, cluster.TLS.Insecure, rpc.PassthroughTokenProvider) + ctx := auth.NewContext(context.Background(), auth.NewCredentials(cluster.SystemRootToken)) + _, err = conn.UserGetCurrent(ctx, arvados.GetOptions{}) + if err != nil { + err = fmt.Errorf("API request failed: %w", err) + return 1 + } + fmt.Fprintln(stderr, "...looks good") + } + + if out, err := exec.CommandContext(ctx, "docker", "version").CombinedOutput(); err == nil && strings.Contains(string(out), "\nServer:\n") { + fmt.Fprintln(stderr, "loading alpine docker image for diagnostics...") + cmd := exec.CommandContext(ctx, "docker", "pull", "alpine") + cmd.Stdout = stderr + cmd.Stderr = stderr + err = cmd.Run() + if err != nil { + err = fmt.Errorf("%v: %w", cmd.Args, err) + return 1 + } + cmd = exec.CommandContext(ctx, "arv", "sudo", "keep", "docker", "alpine") + cmd.Stdout = stderr + cmd.Stderr = stderr + err = cmd.Run() + if err != nil { + err = fmt.Errorf("%v: %w", cmd.Args, err) + return 1 + } + fmt.Fprintln(stderr, "...done") + } else { + fmt.Fprintln(stderr, "docker is not installed -- skipping step of downloading 'alpine' image") } + fmt.Fprintf(stderr, ` +Setup complete. Next steps: +* run 'arv sudo diagnostics' +* log in to workbench2 at %s +* see documentation at https://doc.arvados.org/install/automatic.html +`, cluster.Services.Workbench2.ExternalURL.String()) + return 0 } @@ -297,18 +427,98 @@ func (initcmd *initCommand) RandomHex(chars int) string { } func (initcmd *initCommand) createDB(ctx context.Context, dbconn arvados.PostgreSQLConnection, stderr io.Writer) error { - for _, sql := range []string{ - `CREATE USER ` + pq.QuoteIdentifier(dbconn["user"]) + ` WITH SUPERUSER ENCRYPTED PASSWORD ` + pq.QuoteLiteral(dbconn["password"]), - `CREATE DATABASE ` + pq.QuoteIdentifier(dbconn["dbname"]) + ` WITH TEMPLATE template0 ENCODING 'utf8'`, - `CREATE EXTENSION IF NOT EXISTS pg_trgm`, - } { - cmd := exec.CommandContext(ctx, "sudo", "-u", "postgres", "psql", "-c", sql) - cmd.Stdout = stderr - cmd.Stderr = stderr - err := cmd.Run() - if err != nil { - return fmt.Errorf("error setting up arvados user/database: %w", err) - } + cmd := exec.CommandContext(ctx, "sudo", "-u", "postgres", "psql", "--quiet", + "-c", `CREATE USER `+pq.QuoteIdentifier(dbconn["user"])+` WITH SUPERUSER ENCRYPTED PASSWORD `+pq.QuoteLiteral(dbconn["password"]), + "-c", `CREATE DATABASE `+pq.QuoteIdentifier(dbconn["dbname"])+` WITH TEMPLATE template0 ENCODING 'utf8'`, + ) + cmd.Dir = "/" + cmd.Stdout = stderr + cmd.Stderr = stderr + err := cmd.Run() + if err != nil { + return fmt.Errorf("error setting up arvados user/database: %w", err) + } + return nil +} + +// Confirm that http://{initcmd.Domain}:{port} reaches a server that +// we run on {port}. +// +// If port is "80", listening fails, and Nginx appears to be using the +// debian-packaged default configuration that listens on port 80, +// disable that Nginx config and try again. +// +// (Typically, the reason Nginx is installed is so that Arvados can +// run an Nginx child process; the default Nginx service using config +// from /etc/nginx is just an unfortunate side effect of installing +// Nginx by way of the Debian package.) +func (initcmd *initCommand) checkPort(ctx context.Context, port string) error { + err := initcmd.checkPortOnce(ctx, port) + if err == nil || port != "80" { + // success, or poking Nginx in the eye won't help + return err + } + d, err2 := os.Open("/etc/nginx/sites-enabled/.") + if err2 != nil { + return err + } + fis, err2 := d.Readdir(-1) + if err2 != nil || len(fis) != 1 { + return err + } + if target, err2 := os.Readlink("/etc/nginx/sites-enabled/default"); err2 != nil || target != "/etc/nginx/sites-available/default" { + return err + } + err2 = os.Remove("/etc/nginx/sites-enabled/default") + if err2 != nil { + return err + } + exec.CommandContext(ctx, "nginx", "-s", "reload").Run() + time.Sleep(time.Second) + return initcmd.checkPortOnce(ctx, port) +} + +// Start an http server on 0.0.0.0:{port} and confirm that +// http://{initcmd.Domain}:{port} reaches that server. +func (initcmd *initCommand) checkPortOnce(ctx context.Context, port string) error { + b := make([]byte, 128) + _, err := rand.Read(b) + if err != nil { + return err + } + token := fmt.Sprintf("%x", b) + + srv := http.Server{ + Addr: net.JoinHostPort("", port), + Handler: http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) { + fmt.Fprint(w, token) + })} + var errServe atomic.Value + go func() { + errServe.Store(srv.ListenAndServe()) + }() + defer srv.Close() + url := "http://" + net.JoinHostPort(initcmd.Domain, port) + "/probe" + req, err := http.NewRequestWithContext(ctx, "GET", url, nil) + if err != nil { + return err + } + resp, err := http.DefaultClient.Do(req) + if err == nil { + defer resp.Body.Close() + } + if errServe, _ := errServe.Load().(error); errServe != nil { + // If server already exited, return that error + // (probably "can't listen"), not the request error. + return errServe + } + if err != nil { + return err + } + buf := make([]byte, len(token)) + n, err := io.ReadFull(resp.Body, buf) + if string(buf[:n]) != token { + return fmt.Errorf("listened on port %s but %s connected to something else, returned %q, err %v", port, url, buf[:n], err) } return nil }