80b1ed301f7c7b632734d34de57fc0daeea9b0e8
[arvados.git] / services / keep-balance / main.go
1 // Copyright (C) The Arvados Authors. All rights reserved.
2 //
3 // SPDX-License-Identifier: AGPL-3.0
4
5 package main
6
7 import (
8         "context"
9         "flag"
10         "fmt"
11         "io"
12         "os"
13
14         "git.arvados.org/arvados.git/lib/config"
15         "git.arvados.org/arvados.git/lib/service"
16         "git.arvados.org/arvados.git/sdk/go/arvados"
17         "git.arvados.org/arvados.git/sdk/go/ctxlog"
18         "git.arvados.org/arvados.git/sdk/go/health"
19         "github.com/jmoiron/sqlx"
20         "github.com/prometheus/client_golang/prometheus"
21         "github.com/sirupsen/logrus"
22 )
23
24 func main() {
25         os.Exit(runCommand(os.Args[0], os.Args[1:], os.Stdin, os.Stdout, os.Stderr))
26 }
27
28 func runCommand(prog string, args []string, stdin io.Reader, stdout, stderr io.Writer) int {
29         logger := ctxlog.FromContext(context.Background())
30
31         var options RunOptions
32         flags := flag.NewFlagSet(prog, flag.ExitOnError)
33         flags.BoolVar(&options.Once, "once", false,
34                 "balance once and then exit")
35         flags.BoolVar(&options.CommitPulls, "commit-pulls", false,
36                 "send pull requests (make more replicas of blocks that are underreplicated or are not in optimal rendezvous probe order)")
37         flags.BoolVar(&options.CommitTrash, "commit-trash", false,
38                 "send trash requests (delete unreferenced old blocks, and excess replicas of overreplicated blocks)")
39         flags.Bool("version", false, "Write version information to stdout and exit 0")
40         dumpFlag := flags.Bool("dump", false, "dump details for each block to stdout")
41
42         loader := config.NewLoader(os.Stdin, logger)
43         loader.SetupFlags(flags)
44
45         munged := loader.MungeLegacyConfigArgs(logger, args, "-legacy-keepbalance-config")
46         flags.Parse(munged)
47
48         if *dumpFlag {
49                 dumper := logrus.New()
50                 dumper.Out = os.Stdout
51                 dumper.Formatter = &logrus.TextFormatter{}
52                 options.Dumper = dumper
53         }
54
55         // Drop our custom args that would be rejected by the generic
56         // service.Command
57         args = nil
58         dropFlag := map[string]bool{
59                 "once":         true,
60                 "commit-pulls": true,
61                 "commit-trash": true,
62                 "dump":         true,
63         }
64         flags.Visit(func(f *flag.Flag) {
65                 if !dropFlag[f.Name] {
66                         args = append(args, "-"+f.Name, f.Value.String())
67                 }
68         })
69
70         return service.Command(arvados.ServiceNameKeepbalance,
71                 func(ctx context.Context, cluster *arvados.Cluster, token string, registry *prometheus.Registry) service.Handler {
72                         if !options.Once && cluster.Collections.BalancePeriod == arvados.Duration(0) {
73                                 return service.ErrorHandler(ctx, cluster, fmt.Errorf("cannot start service: Collections.BalancePeriod is zero (if you want to run once and then exit, use the -once flag)"))
74                         }
75
76                         ac, err := arvados.NewClientFromConfig(cluster)
77                         ac.AuthToken = token
78                         if err != nil {
79                                 return service.ErrorHandler(ctx, cluster, fmt.Errorf("error initializing client from cluster config: %s", err))
80                         }
81
82                         db, err := sqlx.Open("postgres", cluster.PostgreSQL.Connection.String())
83                         if err != nil {
84                                 return service.ErrorHandler(ctx, cluster, fmt.Errorf("postgresql connection failed: %s", err))
85                         }
86                         if p := cluster.PostgreSQL.ConnectionPool; p > 0 {
87                                 db.SetMaxOpenConns(p)
88                         }
89                         err = db.Ping()
90                         if err != nil {
91                                 return service.ErrorHandler(ctx, cluster, fmt.Errorf("postgresql connection succeeded but ping failed: %s", err))
92                         }
93
94                         if options.Logger == nil {
95                                 options.Logger = ctxlog.FromContext(ctx)
96                         }
97
98                         srv := &Server{
99                                 Cluster:    cluster,
100                                 ArvClient:  ac,
101                                 RunOptions: options,
102                                 Metrics:    newMetrics(registry),
103                                 Logger:     options.Logger,
104                                 Dumper:     options.Dumper,
105                                 DB:         db,
106                         }
107                         srv.Handler = &health.Handler{
108                                 Token:  cluster.ManagementToken,
109                                 Prefix: "/_health/",
110                                 Routes: health.Routes{"ping": srv.CheckHealth},
111                         }
112
113                         go srv.run()
114                         return srv
115                 }).RunCommand(prog, args, stdin, stdout, stderr)
116 }