19385: Messy work in progress for uploading workflows to collections
[arvados.git] / sdk / go / arvados / config.go
1 // Copyright (C) The Arvados Authors. All rights reserved.
2 //
3 // SPDX-License-Identifier: Apache-2.0
4
5 package arvados
6
7 import (
8         "encoding/json"
9         "errors"
10         "fmt"
11         "net/url"
12         "os"
13         "time"
14
15         "git.arvados.org/arvados.git/sdk/go/config"
16 )
17
// DefaultConfigFile is the value of the ARVADOS_CONFIG environment
// variable if that is set to a non-empty string, and
// "/etc/arvados/config.yml" otherwise. The choice is made once, when
// the package is initialized.
var DefaultConfigFile = func() string {
	const fallback = "/etc/arvados/config.yml"
	if fromEnv, isSet := os.LookupEnv("ARVADOS_CONFIG"); isSet && fromEnv != "" {
		return fromEnv
	}
	return fallback
}()
24
// Config is the top-level configuration document: a set of clusters
// plus a few document-level fields.
25 type Config struct {
           // Clusters holds one entry per configured cluster, keyed by
           // cluster ID. GetCluster copies the key into the returned
           // Cluster's ClusterID field.
26         Clusters         map[string]Cluster
27         AutoReloadConfig bool
           // NOTE(review): SourceTimestamp and SourceSHA256 presumably
           // describe the file the config was loaded from; nothing in
           // this file sets them -- confirm against the loader.
28         SourceTimestamp  time.Time
29         SourceSHA256     string
30 }
31
32 // GetConfig returns the current system config, loading it from
33 // configFile if needed.
34 func GetConfig(configFile string) (*Config, error) {
35         var cfg Config
36         err := config.LoadFile(&cfg, configFile)
37         return &cfg, err
38 }
39
40 // GetCluster returns the cluster ID and config for the given
41 // cluster, or the default/only configured cluster if clusterID is "".
42 func (sc *Config) GetCluster(clusterID string) (*Cluster, error) {
43         if clusterID == "" {
44                 if len(sc.Clusters) == 0 {
45                         return nil, fmt.Errorf("no clusters configured")
46                 } else if len(sc.Clusters) > 1 {
47                         return nil, fmt.Errorf("multiple clusters configured, cannot choose")
48                 } else {
49                         for id, cc := range sc.Clusters {
50                                 cc.ClusterID = id
51                                 return &cc, nil
52                         }
53                 }
54         }
55         cc, ok := sc.Clusters[clusterID]
56         if !ok {
57                 return nil, fmt.Errorf("cluster %q is not configured", clusterID)
58         }
59         cc.ClusterID = clusterID
60         return &cc, nil
61 }
62
// WebDAVCacheConfig is the type of Cluster.Collections.WebDAVCache:
// a time-to-live plus three size limits.
// NOTE(review): how each limit is enforced is not visible in this
// file -- confirm against the code that consumes it.
63 type WebDAVCacheConfig struct {
64         TTL                Duration
65         MaxBlockEntries    int
66         MaxCollectionBytes int64
67         MaxSessions        int
68 }
69
// UploadDownloadPermission is a pair of independent switches, one
// for uploads and one for downloads.
type UploadDownloadPermission struct {
	Upload, Download bool
}

// UploadDownloadRolePermissions carries one UploadDownloadPermission
// for the User role and one for the Admin role.
type UploadDownloadRolePermissions struct {
	User, Admin UploadDownloadPermission
}
79
// ManagedProperties is the type of
// Cluster.Collections.ManagedProperties: a map from a string key to
// a small record with a Value, a Function name and a Protected flag.
// NOTE(review): presumably the key is a property name and
// Value/Function are alternative ways to supply its value -- confirm
// against the code that applies managed properties.
80 type ManagedProperties map[string]struct {
81         Value     interface{}
82         Function  string
83         Protected bool
84 }
85
// Cluster is the configuration of a single cluster; Config.Clusters
// holds one Cluster per cluster ID. Settings are grouped into nested
// sections (API, AuditLogs, Collections, Git, Login, Mail,
// SystemLogs, TLS, Users, Workbench) declared as anonymous structs.
86 type Cluster struct {
           // ClusterID is excluded from JSON (tag "-"). GetCluster fills
           // it in from the Config.Clusters map key.
87         ClusterID       string `json:"-"`
88         ManagementToken string
89         SystemRootToken string
90         Services        Services
           // InstanceTypes is decoded by InstanceTypeMap.UnmarshalJSON,
           // which also fills in each entry's computed fields.
91         InstanceTypes   InstanceTypeMap
92         Containers      ContainersConfig
93         RemoteClusters  map[string]RemoteCluster
94         PostgreSQL      PostgreSQL
95
           // API: request limits, timeouts and other API-level settings.
96         API struct {
97                 AsyncPermissionsUpdateInterval   Duration
98                 DisabledAPIs                     StringSet
99                 MaxIndexDatabaseRead             int
100                 MaxItemsPerResponse              int
101                 MaxConcurrentRequests            int
102                 MaxKeepBlobBuffers               int
103                 MaxRequestAmplification          int
104                 MaxRequestSize                   int
105                 MaxTokenLifetime                 Duration
106                 RequestTimeout                   Duration
107                 SendTimeout                      Duration
108                 WebsocketClientEventQueue        int
109                 WebsocketServerEventQueue        int
110                 KeepServiceRequestTimeout        Duration
111                 VocabularyPath                   string
112                 FreezeProjectRequiresDescription bool
113                 FreezeProjectRequiresProperties  StringSet
114                 UnfreezeProjectRequiresAdmin     bool
115         }
116         AuditLogs struct {
117                 MaxAge             Duration
118                 MaxDeleteBatch     int
119                 UnloggedAttributes StringSet
120         }
            // Collections: blob signing/trash settings, collection
            // defaults, the Balance* settings, and the WebDAV /
            // keepproxy cache and permission settings.
121         Collections struct {
122                 BlobSigning                  bool
123                 BlobSigningKey               string
124                 BlobSigningTTL               Duration
125                 BlobTrash                    bool
126                 BlobTrashLifetime            Duration
127                 BlobTrashCheckInterval       Duration
128                 BlobTrashConcurrency         int
129                 BlobDeleteConcurrency        int
130                 BlobReplicateConcurrency     int
131                 CollectionVersioning         bool
132                 DefaultTrashLifetime         Duration
133                 DefaultReplication           int
134                 ManagedProperties            ManagedProperties
135                 PreserveVersionIfIdle        Duration
136                 TrashSweepInterval           Duration
137                 TrustAllContent              bool
138                 ForwardSlashNameSubstitution string
139                 S3FolderObjects              bool
140
141                 BlobMissingReport        string
142                 BalancePeriod            Duration
143                 BalanceCollectionBatch   int
144                 BalanceCollectionBuffers int
145                 BalanceTimeout           Duration
146                 BalanceUpdateLimit       int
147
148                 WebDAVCache WebDAVCacheConfig
149
150                 KeepproxyPermission UploadDownloadRolePermissions
151                 WebDAVPermission    UploadDownloadRolePermissions
152                 WebDAVLogEvents     bool
153         }
154         Git struct {
155                 GitCommand   string
156                 GitoliteHome string
157                 Repositories string
158         }
            // Login: one subsection per login provider (LDAP, Google,
            // OpenIDConnect, PAM, Test), each with its own Enable flag,
            // followed by settings that are not tied to one provider.
159         Login struct {
160                 LDAP struct {
161                         Enable             bool
162                         URL                URL
163                         StartTLS           bool
164                         InsecureTLS        bool
165                         StripDomain        string
166                         AppendDomain       string
167                         SearchAttribute    string
168                         SearchBindUser     string
169                         SearchBindPassword string
170                         SearchBase         string
171                         SearchFilters      string
172                         EmailAttribute     string
173                         UsernameAttribute  string
174                 }
175                 Google struct {
176                         Enable                          bool
177                         ClientID                        string
178                         ClientSecret                    string
179                         AlternateEmailAddresses         bool
180                         AuthenticationRequestParameters map[string]string
181                 }
182                 OpenIDConnect struct {
183                         Enable                          bool
184                         Issuer                          string
185                         ClientID                        string
186                         ClientSecret                    string
187                         EmailClaim                      string
188                         EmailVerifiedClaim              string
189                         UsernameClaim                   string
190                         AcceptAccessToken               bool
191                         AcceptAccessTokenScope          string
192                         AuthenticationRequestParameters map[string]string
193                 }
194                 PAM struct {
195                         Enable             bool
196                         Service            string
197                         DefaultEmailDomain string
198                 }
199                 Test struct {
200                         Enable bool
201                         Users  map[string]TestUser
202                 }
203                 LoginCluster         string
204                 RemoteTokenRefresh   Duration
205                 TokenLifetime        Duration
                    // TrustedClients is a set of URLs: the map values
                    // are empty structs, only the keys carry data.
206                 TrustedClients       map[URL]struct{}
207                 TrustPrivateNetworks bool
208                 IssueTrustedTokens   bool
209         }
210         Mail struct {
211                 MailchimpAPIKey                string
212                 MailchimpListID                string
213                 SendUserSetupNotificationEmail bool
214                 IssueReporterEmailFrom         string
215                 IssueReporterEmailTo           string
216                 SupportEmailAddress            string
217                 EmailFrom                      string
218         }
219         SystemLogs struct {
220                 LogLevel                string
221                 Format                  string
222                 MaxRequestLogParamsSize int
223         }
224         TLS struct {
225                 Certificate string
226                 Key         string
227                 Insecure    bool
228                 ACME        struct {
229                         Server string
230                 }
231         }
232         Users struct {
233                 ActivatedUsersAreVisibleToOthers      bool
234                 AnonymousUserToken                    string
235                 AdminNotifierEmailFrom                string
236                 AutoAdminFirstUser                    bool
237                 AutoAdminUserWithEmail                string
238                 AutoSetupNewUsers                     bool
239                 AutoSetupNewUsersWithRepository       bool
240                 AutoSetupNewUsersWithVmUUID           string
241                 AutoSetupUsernameBlacklist            StringSet
242                 EmailSubjectPrefix                    string
243                 NewInactiveUserNotificationRecipients StringSet
244                 NewUserNotificationRecipients         StringSet
245                 NewUsersAreActive                     bool
246                 UserNotifierEmailFrom                 string
247                 UserNotifierEmailBcc                  StringSet
248                 UserProfileNotificationAddress        string
249                 PreferDomainForUsername               string
250                 UserSetupMailText                     string
251                 RoleGroupsVisibleToAll                bool
252                 CanCreateRoleGroups                   bool
253                 ActivityLoggingPeriod                 Duration
254         }
255         StorageClasses map[string]StorageClassConfig
256         Volumes        map[string]Volume
257         Workbench      struct {
258                 ActivationContactLink            string
259                 APIClientConnectTimeout          Duration
260                 APIClientReceiveTimeout          Duration
261                 APIResponseCompression           bool
262                 ApplicationMimetypesWithViewIcon StringSet
263                 ArvadosDocsite                   string
264                 ArvadosPublicDataDocURL          string
265                 DefaultOpenIdPrefix              string
266                 DisableSharingURLsUI             bool
267                 EnableGettingStartedPopup        bool
268                 EnablePublicProjectsPage         bool
269                 FileViewersConfigURL             string
270                 LogViewerMaxBytes                ByteSize
271                 MultiSiteSearch                  string
272                 ProfilingEnabled                 bool
273                 Repositories                     bool
274                 RepositoryCache                  string
275                 RunningJobLogRecordsToFetch      int
276                 SecretKeyBase                    string
277                 ShowRecentCollectionsOnDashboard bool
278                 ShowUserAgreementInline          bool
279                 ShowUserNotifications            bool
280                 SiteName                         string
281                 Theme                            string
                    // UserProfileFormFields maps a string key to the
                    // description of one profile form field; Options
                    // is a set of strings (empty-struct values).
282                 UserProfileFormFields            map[string]struct {
283                         Type                 string
284                         FormFieldTitle       string
285                         FormFieldDescription string
286                         Required             bool
287                         Position             int
288                         Options              map[string]struct{}
289                 }
290                 UserProfileFormMessage string
291                 WelcomePageHTML        string
292                 InactivePageHTML       string
293                 SSHHelpPageHTML        string
294                 SSHHelpHostSuffix      string
295                 IdleTimeout            Duration
296                 BannerURL              string
297         }
298 }
299
// StorageClassConfig is the value type of Cluster.StorageClasses:
// a Default flag and an integer Priority for one storage class.
// NOTE(review): whether a higher or lower Priority wins is not
// visible in this file -- confirm.
300 type StorageClassConfig struct {
301         Default  bool
302         Priority int
303 }
304
// Volume is the value type of Cluster.Volumes and describes one
// storage volume.
305 type Volume struct {
            // AccessViaHosts maps a URL to the access settings
            // (VolumeAccess) that apply via that URL.
306         AccessViaHosts   map[URL]VolumeAccess
307         ReadOnly         bool
308         Replication      int
309         StorageClasses   map[string]bool
310         Driver           string
            // DriverParameters is kept as undecoded JSON
            // (json.RawMessage); this struct does not interpret it.
            // NOTE(review): presumably decoded into one of the
            // *VolumeDriverParameters structs according to Driver --
            // confirm against the volume drivers.
311         DriverParameters json.RawMessage
312 }
313
314 type S3VolumeDriverParameters struct {
315         IAMRole            string
316         AccessKeyID        string
317         SecretAccessKey    string
318         Endpoint           string
319         Region             string
320         Bucket             string
321         LocationConstraint bool
322         V2Signature        bool
323         UseAWSS3v2Driver   bool
324         IndexPageSize      int
325         ConnectTimeout     Duration
326         ReadTimeout        Duration
327         RaceWindow         Duration
328         UnsafeDelete       bool
329         PrefixLength       int
330 }
331
332 type AzureVolumeDriverParameters struct {
333         StorageAccountName   string
334         StorageAccountKey    string
335         StorageBaseURL       string
336         ContainerName        string
337         RequestTimeout       Duration
338         ListBlobsRetryDelay  Duration
339         ListBlobsMaxAttempts int
340 }
341
// DirectoryVolumeDriverParameters lists the driver-specific settings
// of a directory volume: a Root string and a Serialize flag.
// NOTE(review): presumably Root is a filesystem path and Serialize
// requests one-at-a-time I/O -- confirm against the driver.
342 type DirectoryVolumeDriverParameters struct {
343         Root      string
344         Serialize bool
345 }
346
// VolumeAccess is the value type of Volume.AccessViaHosts; its only
// setting is a ReadOnly flag.
347 type VolumeAccess struct {
348         ReadOnly bool
349 }
350
351 type Services struct {
352         Composer       Service
353         Controller     Service
354         DispatchCloud  Service
355         DispatchLSF    Service
356         DispatchSLURM  Service
357         GitHTTP        Service
358         GitSSH         Service
359         Health         Service
360         Keepbalance    Service
361         Keepproxy      Service
362         Keepstore      Service
363         RailsAPI       Service
364         WebDAVDownload Service
365         WebDAV         Service
366         WebShell       Service
367         Websocket      Service
368         Workbench1     Service
369         Workbench2     Service
370 }
371
// Service is the configuration of one service: a map of internal
// URLs, each with its own ServiceInstance settings, and a single
// external URL.
372 type Service struct {
373         InternalURLs map[URL]ServiceInstance
374         ExternalURL  URL
375 }
376
// TestUser is the value type of Cluster.Login.Test.Users: the email
// address and password of one test login account.
type TestUser struct {
	Email, Password string
}
381
// URL has the same layout as url.URL, and adds the text
// marshaling methods that let it appear as a JSON object key or
// string value.
type URL url.URL

// UnmarshalText implements encoding.TextUnmarshaler by parsing text
// with url.Parse. A URL that names a host but has an empty path is
// given the path "/", so "http://example" and "http://example/"
// decode to the same value. On a parse error su is left untouched.
func (su *URL) UnmarshalText(text []byte) error {
	parsed, err := url.Parse(string(text))
	if err != nil {
		return err
	}
	*su = URL(*parsed)
	if su.Host != "" && su.Path == "" {
		// http://example really means http://example/
		su.Path = "/"
	}
	return nil
}

// MarshalText implements encoding.TextMarshaler; it returns the
// bytes of su.String() and never fails.
func (su URL) MarshalText() ([]byte, error) {
	text := su.String()
	return []byte(text), nil
}

// String renders su exactly as url.URL's String method would.
func (su URL) String() string {
	std := url.URL(su)
	return std.String()
}
406
// ServiceInstance is the value type of Service.InternalURLs and
// holds the settings of one internal URL.
407 type ServiceInstance struct {
408         ListenURL  URL
            // Rendezvous is left out of JSON output when empty
            // (omitempty).
409         Rendezvous string `json:",omitempty"`
410 }
411
// PostgreSQL is the type of Cluster.PostgreSQL: connection
// parameters plus an integer ConnectionPool setting.
412 type PostgreSQL struct {
413         Connection     PostgreSQLConnection
414         ConnectionPool int
415 }
416
// PostgreSQLConnection is a set of string key/value pairs.
// NOTE(review): presumably PostgreSQL connection-string parameters
// (host, dbname, ...) -- confirm against the code that builds the
// connection string.
417 type PostgreSQLConnection map[string]string
418
// RemoteCluster is the value type of Cluster.RemoteClusters and
// describes how one remote cluster is reached (Host, Scheme, Proxy,
// Insecure) and whether its users are activated (ActivateUsers).
type RemoteCluster struct {
	Host                    string
	Proxy                   bool
	Scheme                  string
	Insecure, ActivateUsers bool
}
426
// CUDAFeatures is the type of InstanceType.CUDA: two version-like
// strings and a device count.
type CUDAFeatures struct {
	DriverVersion, HardwareCapability string
	DeviceCount                       int
}
432
433 type InstanceType struct {
434         Name            string `json:"-"`
435         ProviderType    string
436         VCPUs           int
437         RAM             ByteSize
438         Scratch         ByteSize `json:"-"`
439         IncludedScratch ByteSize
440         AddedScratch    ByteSize
441         Price           float64
442         Preemptible     bool
443         CUDA            CUDAFeatures
444 }
445
// ContainersConfig is the type of Cluster.Containers. It holds
// top-level container settings followed by nested sections
// (JobsAPI, Logging, ShellAccess, SLURM, LSF) declared as anonymous
// structs.
446 type ContainersConfig struct {
447         CloudVMs                      CloudVMsConfig
448         CrunchRunCommand              string
449         CrunchRunArgumentsList        []string
450         DefaultKeepCacheRAM           ByteSize
451         DispatchPrivateKey            string
452         LogReuseDecisions             bool
453         MaxComputeVMs                 int
454         MaxDispatchAttempts           int
455         MaxRetryAttempts              int
456         MinRetryPeriod                Duration
457         ReserveExtraRAM               ByteSize
458         StaleLockTimeout              Duration
459         SupportedDockerImageFormats   StringSet
460         AlwaysUsePreemptibleInstances bool
461         PreemptiblePriceFactor        float64
462         RuntimeEngine                 string
463         LocalKeepBlobBuffersPerVCPU   int
            // Note this is a string, not a bool.
            // NOTE(review): the accepted values are not visible in
            // this file -- confirm.
464         LocalKeepLogsToContainerLog   string
465
466         JobsAPI struct {
                    // Enable is a string here, unlike the bool Enable
                    // flags used elsewhere in this file.
467                 Enable         string
468                 GitInternalDir string
469         }
470         Logging struct {
471                 MaxAge                       Duration
472                 SweepInterval                Duration
473                 LogBytesPerEvent             int
474                 LogSecondsBetweenEvents      Duration
475                 LogThrottlePeriod            Duration
476                 LogThrottleBytes             int
477                 LogThrottleLines             int
478                 LimitLogBytesPerJob          int
479                 LogPartialLineThrottlePeriod Duration
480                 LogUpdatePeriod              Duration
481                 LogUpdateSize                ByteSize
482         }
            // ShellAccess has one flag per role (Admin, User).
483         ShellAccess struct {
484                 Admin bool
485                 User  bool
486         }
487         SLURM struct {
488                 PrioritySpread             int64
489                 SbatchArgumentsList        []string
490                 SbatchEnvironmentVariables map[string]string
491                 Managed                    struct {
492                         DNSServerConfDir       string
493                         DNSServerConfTemplate  string
494                         DNSServerReloadCommand string
495                         DNSServerUpdateCommand string
496                         ComputeNodeDomain      string
497                         ComputeNodeNameservers StringSet
498                         AssignNodeHostname     string
499                 }
500         }
501         LSF struct {
502                 BsubSudoUser      string
503                 BsubArgumentsList []string
504                 BsubCUDAArguments []string
505         }
506 }
507
// CloudVMsConfig is the type of ContainersConfig.CloudVMs: an Enable
// flag, a block of rate limits, intervals and timeouts, and the
// driver selection.
508 type CloudVMsConfig struct {
509         Enable bool
510
511         BootProbeCommand               string
512         DeployRunnerBinary             string
513         ImageID                        string
514         MaxCloudOpsPerSecond           int
515         MaxProbesPerSecond             int
516         MaxConcurrentInstanceCreateOps int
517         PollInterval                   Duration
518         ProbeInterval                  Duration
            // SSHPort is a string, not an int.
519         SSHPort                        string
520         SyncInterval                   Duration
521         TimeoutBooting                 Duration
522         TimeoutIdle                    Duration
523         TimeoutProbe                   Duration
524         TimeoutShutdown                Duration
525         TimeoutSignal                  Duration
526         TimeoutStaleRunLock            Duration
527         TimeoutTERM                    Duration
528         ResourceTags                   map[string]string
529         TagKeyPrefix                   string
530
531         Driver           string
            // DriverParameters is kept as undecoded JSON
            // (json.RawMessage); this struct does not interpret it.
            // NOTE(review): presumably decoded by the driver named in
            // Driver -- confirm.
532         DriverParameters json.RawMessage
533 }
534
535 type InstanceTypeMap map[string]InstanceType
536
537 var errDuplicateInstanceTypeName = errors.New("duplicate instance type name")
538
539 // UnmarshalJSON does special handling of InstanceTypes:
540 //
541 // - populate computed fields (Name and Scratch)
542 //
543 // - error out if InstancesTypes are populated as an array, which was
544 // deprecated in Arvados 1.2.0
545 func (it *InstanceTypeMap) UnmarshalJSON(data []byte) error {
546         fixup := func(t InstanceType) (InstanceType, error) {
547                 if t.ProviderType == "" {
548                         t.ProviderType = t.Name
549                 }
550                 // If t.Scratch is set in the configuration file, it will be ignored and overwritten.
551                 // It will also generate a "deprecated or unknown config entry" warning.
552                 t.Scratch = t.IncludedScratch + t.AddedScratch
553                 return t, nil
554         }
555
556         if len(data) > 0 && data[0] == '[' {
557                 return fmt.Errorf("InstanceTypes must be specified as a map, not an array, see https://doc.arvados.org/admin/config.html")
558         }
559         var hash map[string]InstanceType
560         err := json.Unmarshal(data, &hash)
561         if err != nil {
562                 return err
563         }
564         // Fill in Name field (and ProviderType field, if not
565         // specified) using hash key.
566         *it = InstanceTypeMap(hash)
567         for name, t := range *it {
568                 t.Name = name
569                 t, err := fixup(t)
570                 if err != nil {
571                         return err
572                 }
573                 (*it)[name] = t
574         }
575         return nil
576 }
577
// StringSet is a set of strings, represented as a map whose values
// carry no data.
type StringSet map[string]struct{}

// UnmarshalJSON accepts a string set written either as a JSON array
// of strings (["a","b"]) or as a JSON object whose keys are the
// members ({"a":{},"b":{}}).
//
// An empty array yields a nil set. An empty object, or JSON null,
// yields an empty non-nil set. Any previous content of *ss is
// replaced. On error, *ss is left unchanged.
func (ss *StringSet) UnmarshalJSON(data []byte) error {
	if len(data) > 0 && data[0] == '[' {
		var members []string
		if err := json.Unmarshal(data, &members); err != nil {
			return err
		}
		if len(members) == 0 {
			*ss = nil
			return nil
		}
		set := make(StringSet, len(members))
		for _, m := range members {
			set[m] = struct{}{}
		}
		*ss = set
		return nil
	}
	var set map[string]struct{}
	if err := json.Unmarshal(data, &set); err != nil {
		return err
	}
	if set == nil {
		// JSON null decodes to a nil map; callers of the object
		// form have always received a non-nil set.
		set = map[string]struct{}{}
	}
	*ss = set
	return nil
}
611
// ServiceName is a string that names a service. The constants below
// are the names used as keys by Services.Map.
type ServiceName string

// Known service names.
const (
	ServiceNameController    = ServiceName("arvados-controller")
	ServiceNameDispatchCloud = ServiceName("arvados-dispatch-cloud")
	ServiceNameDispatchLSF   = ServiceName("arvados-dispatch-lsf")
	ServiceNameDispatchSLURM = ServiceName("crunch-dispatch-slurm")
	ServiceNameGitHTTP       = ServiceName("arvados-git-httpd")
	ServiceNameHealth        = ServiceName("arvados-health")
	ServiceNameKeepbalance   = ServiceName("keep-balance")
	ServiceNameKeepproxy     = ServiceName("keepproxy")
	ServiceNameKeepstore     = ServiceName("keepstore")
	ServiceNameKeepweb       = ServiceName("keep-web")
	ServiceNameRailsAPI      = ServiceName("arvados-api-server")
	ServiceNameWebsocket     = ServiceName("arvados-ws")
	ServiceNameWorkbench1    = ServiceName("arvados-workbench1")
	ServiceNameWorkbench2    = ServiceName("arvados-workbench2")
)
630
631 // Map returns all services as a map, suitable for iterating over all
632 // services or looking up a service by name.
633 func (svcs Services) Map() map[ServiceName]Service {
634         return map[ServiceName]Service{
635                 ServiceNameController:    svcs.Controller,
636                 ServiceNameDispatchCloud: svcs.DispatchCloud,
637                 ServiceNameDispatchLSF:   svcs.DispatchLSF,
638                 ServiceNameDispatchSLURM: svcs.DispatchSLURM,
639                 ServiceNameGitHTTP:       svcs.GitHTTP,
640                 ServiceNameHealth:        svcs.Health,
641                 ServiceNameKeepbalance:   svcs.Keepbalance,
642                 ServiceNameKeepproxy:     svcs.Keepproxy,
643                 ServiceNameKeepstore:     svcs.Keepstore,
644                 ServiceNameKeepweb:       svcs.WebDAV,
645                 ServiceNameRailsAPI:      svcs.RailsAPI,
646                 ServiceNameWebsocket:     svcs.Websocket,
647                 ServiceNameWorkbench1:    svcs.Workbench1,
648                 ServiceNameWorkbench2:    svcs.Workbench2,
649         }
650 }