1 // Copyright (C) The Arvados Authors. All rights reserved.
3 // SPDX-License-Identifier: Apache-2.0
13 "git.curoverse.com/arvados.git/sdk/go/config"
// DefaultConfigFile is, per its name, the default location of the
// system config file.
// NOTE(review): no use of this constant is visible in this excerpt;
// confirm which callers pass it to GetConfig.
16 const DefaultConfigFile = "/etc/arvados/config.yml"
19 Clusters map[string]Cluster
22 // GetConfig returns the current system config, loading it from
23 // configFile if needed.
24 func GetConfig(configFile string) (*Config, error) {
// NOTE(review): the statement visible here hands configFile straight
// to config.LoadFile; confirm what "if needed" in the doc comment
// refers to.
26 err := config.LoadFile(&cfg, configFile)
30 // GetCluster returns the config for the given cluster, or for the
31 // default/only configured cluster if clusterID is "".
//
// The cluster ID is not a separate return value: for a named cluster
// it is stored in the ClusterID field of the returned Cluster.
//
// Error cases visible here: no clusters are configured, more than
// one cluster is configured so none can be chosen, or the named
// cluster is not configured.
32 func (sc *Config) GetCluster(clusterID string) (*Cluster, error) {
34 if len(sc.Clusters) == 0 {
35 return nil, fmt.Errorf("no clusters configured")
36 } else if len(sc.Clusters) > 1 {
37 return nil, fmt.Errorf("multiple clusters configured, cannot choose")
// Iterate over the configured clusters by ID.
39 for id, cc := range sc.Clusters {
// Look the requested ID up directly; a missing key is an error.
45 if cc, ok := sc.Clusters[clusterID]; !ok {
46 return nil, fmt.Errorf("cluster %q is not configured", clusterID)
// Record the ID on the config value itself.
48 cc.ClusterID = clusterID
// RequestLimits holds two integer request limits. The matching
// GetMaxItemsPerResponse and GetMultiClusterRequestConcurrency
// accessors test each field for zero before returning it.
53 type RequestLimits struct {
54 MaxItemsPerResponse int
55 MultiClusterRequestConcurrency int
59 ClusterID string `json:"-"`
60 ManagementToken string
61 NodeProfiles map[string]NodeProfile
62 InstanceTypes InstanceTypeMap
65 HTTPRequestTimeout Duration
66 RemoteClusters map[string]RemoteCluster
68 RequestLimits RequestLimits
// PostgreSQL groups PostgreSQL settings; Connection carries them as
// a PostgreSQLConnection map.
71 type PostgreSQL struct {
72 Connection PostgreSQLConnection
// PostgreSQLConnection is a string-to-string map.
// NOTE(review): presumably connection parameter names mapped to
// their values; confirm against the code that consumes it.
76 type PostgreSQLConnection map[string]string
// RemoteCluster describes one remote cluster. Per the field comments
// below it covers the API endpoint, whether local client requests
// for the remote's objects are proxied, the URL scheme, and whether
// TLS verification is disabled.
78 type RemoteCluster struct {
79 // API endpoint host or host:port; default is {id}.arvadosapi.com
81 // Perform a proxy request when a local client requests an
82 // object belonging to this remote.
84 // Scheme, default "https". Can be set to "http" for testing.
86 // Disable TLS verify. Can be set to true for testing.
// InstanceType is the element type of InstanceTypeMap. Its Name
// field is what InstanceTypeMap.UnmarshalJSON checks for duplicates.
90 type InstanceType struct {
// Dispatch holds the settings documented on its fields: an SSH key
// for logging in, the stale-lock timeout, the queue poll interval,
// and the per-worker and overall worker probe rates.
100 type Dispatch struct {
101 // PEM encoded SSH key (RSA, DSA, or ECDSA) able to log in to
105 // Max time for workers to come up before abandoning stale
106 // locks from previous run
107 StaleLockTimeout Duration
109 // Interval between queue polls
110 PollInterval Duration
112 // Interval between probes to each worker
113 ProbeInterval Duration
115 // Maximum total worker probes per second
116 MaxProbesPerSecond int
// CloudVMs holds VM settings: the boot probe command, a sync
// interval, the timeouts that lead to automatic shutdown (idle,
// booting, no successful probes), the shutdown retry delay, and
// free-form driver parameters.
119 type CloudVMs struct {
120 // Shell command that exits zero IFF the VM is fully booted
121 // and ready to run containers, e.g., "mount | grep
123 BootProbeCommand string
124 SyncInterval Duration
126 // Maximum idle time before automatic shutdown
129 // Maximum booting time before automatic shutdown
130 TimeoutBooting Duration
132 // Maximum time with no successful probes before automatic shutdown
133 TimeoutProbe Duration
135 // Time after shutdown to retry shutdown
136 TimeoutShutdown Duration
// Untyped key/value parameters.
// NOTE(review): presumably passed through to the cloud driver; confirm.
141 DriverParameters map[string]interface{}
// InstanceTypeMap maps a string key to an InstanceType. Its
// UnmarshalJSON method accepts both the hash form and the older
// array form of the config.
144 type InstanceTypeMap map[string]InstanceType
// errDuplicateInstanceTypeName is returned by
// InstanceTypeMap.UnmarshalJSON when an array-form config contains
// an instance type whose Name is already present in the map.
146 var errDuplicateInstanceTypeName = errors.New("duplicate instance type name")
148 // UnmarshalJSON handles old config files that provide an array of
149 // instance types instead of a hash.
150 func (it *InstanceTypeMap) UnmarshalJSON(data []byte) error {
// A leading '[' marks the old array form.
151 if len(data) > 0 && data[0] == '[' {
152 var arr []InstanceType
153 err := json.Unmarshal(data, &arr)
// Start from an empty map sized to hold every array entry.
161 *it = make(map[string]InstanceType, len(arr))
162 for _, t := range arr {
// A Name that is already a key in the map is reported as a duplicate.
163 if _, ok := (*it)[t.Name]; ok {
164 return errDuplicateInstanceTypeName
// Decode the hash form into a plain map first.
170 var hash map[string]InstanceType
171 err := json.Unmarshal(data, &hash)
175 // Fill in Name field using hash key.
176 *it = InstanceTypeMap(hash)
177 for name, t := range *it {
184 // GetNodeProfile returns a NodeProfile for the given hostname. An
185 // error is returned if the appropriate configuration can't be
186 // determined (e.g., this does not appear to be a system node). If
187 // node is empty, use the OS-reported hostname.
188 func (cc *Cluster) GetNodeProfile(node string) (*NodeProfile, error) {
// Ask the OS for this machine's hostname.
190 hostname, err := os.Hostname()
// Look for an entry keyed by the node name itself.
196 if cfg, ok := cc.NodeProfiles[node]; ok {
199 // If node is not listed, but "*" gives a default system node
200 // config, use the default config.
201 if cfg, ok := cc.NodeProfiles["*"]; ok {
204 return nil, fmt.Errorf("config does not provision host %q as a system node", node)
// NodeProfile holds one SystemServiceInstance per system service.
// Each field's JSON key is the service's name, e.g.
// "arvados-controller" or "keepstore".
207 type NodeProfile struct {
208 Controller SystemServiceInstance `json:"arvados-controller"`
209 Health SystemServiceInstance `json:"arvados-health"`
210 Keepbalance SystemServiceInstance `json:"keep-balance"`
211 Keepproxy SystemServiceInstance `json:"keepproxy"`
212 Keepstore SystemServiceInstance `json:"keepstore"`
213 Keepweb SystemServiceInstance `json:"keep-web"`
214 Nodemanager SystemServiceInstance `json:"arvados-node-manager"`
215 DispatchCloud SystemServiceInstance `json:"arvados-dispatch-cloud"`
216 RailsAPI SystemServiceInstance `json:"arvados-api-server"`
217 Websocket SystemServiceInstance `json:"arvados-ws"`
218 Workbench SystemServiceInstance `json:"arvados-workbench"`
// ServiceName is the string name of a system service. It is the key
// type of the map returned by NodeProfile.ServicePorts.
221 type ServiceName string
// Known service names. Each value equals the JSON key of the
// corresponding NodeProfile field.
224 ServiceNameRailsAPI ServiceName = "arvados-api-server"
225 ServiceNameController ServiceName = "arvados-controller"
226 ServiceNameDispatchCloud ServiceName = "arvados-dispatch-cloud"
227 ServiceNameNodemanager ServiceName = "arvados-node-manager"
228 ServiceNameWorkbench ServiceName = "arvados-workbench"
229 ServiceNameWebsocket ServiceName = "arvados-ws"
230 ServiceNameKeepbalance ServiceName = "keep-balance"
231 ServiceNameKeepweb ServiceName = "keep-web"
232 ServiceNameKeepproxy ServiceName = "keepproxy"
233 ServiceNameKeepstore ServiceName = "keepstore"
236 // ServicePorts returns the configured listening address (or "" if
237 // disabled) for each service on the node.
//
// Each value is the Listen field of the NodeProfile entry for that
// service. The Health entry of NodeProfile does not appear among the
// map entries visible here.
238 func (np *NodeProfile) ServicePorts() map[ServiceName]string {
239 return map[ServiceName]string{
240 ServiceNameRailsAPI: np.RailsAPI.Listen,
241 ServiceNameController: np.Controller.Listen,
242 ServiceNameDispatchCloud: np.DispatchCloud.Listen,
243 ServiceNameNodemanager: np.Nodemanager.Listen,
244 ServiceNameWorkbench: np.Workbench.Listen,
245 ServiceNameWebsocket: np.Websocket.Listen,
246 ServiceNameKeepbalance: np.Keepbalance.Listen,
247 ServiceNameKeepweb: np.Keepweb.Listen,
248 ServiceNameKeepproxy: np.Keepproxy.Listen,
249 ServiceNameKeepstore: np.Keepstore.Listen,
// GetMultiClusterRequestConcurrency returns the configured
// MultiClusterRequestConcurrency when it is nonzero. A zero value
// takes a separate branch whose result is not visible in this
// excerpt.
253 func (h RequestLimits) GetMultiClusterRequestConcurrency() int {
254 if h.MultiClusterRequestConcurrency == 0 {
257 return h.MultiClusterRequestConcurrency
// GetMaxItemsPerResponse returns the configured MaxItemsPerResponse
// when it is nonzero. A zero value takes a separate branch whose
// result is not visible in this excerpt.
260 func (h RequestLimits) GetMaxItemsPerResponse() int {
261 if h.MaxItemsPerResponse == 0 {
264 return h.MaxItemsPerResponse
267 type SystemServiceInstance struct {