Merge branch '18184-singularity-374'
[arvados.git] / services / api / config / arvados_config.rb
1 # Copyright (C) The Arvados Authors. All rights reserved.
2 #
3 # SPDX-License-Identifier: AGPL-3.0
4
5 #
6 # Load Arvados configuration from /etc/arvados/config.yml, using defaults
7 # from config.default.yml
8 #
9 # Existing application.yml is migrated into the new config structure.
10 # Keys in the legacy application.yml take precedence.
11 #
# Use "bundle exec rake config:dump" to get the complete active configuration
#
# Use "bundle exec rake config:migrate" to migrate application.yml and
15 # database.yml to config.yml.  After adding the output of
16 # config:migrate to /etc/arvados/config.yml, you will be able to
17 # delete application.yml and database.yml.
18
require "cgi"
require 'config_loader'
require 'open3'
require 'securerandom'
22
begin
  # If secret_token.rb exists next to this file, it has to be loaded
  # before anything else below runs.
  require_relative 'secret_token.rb'
rescue LoadError
  # Normally secret_token.rb is missing and the secret token is
  # configured by application.yml (i.e., here!) instead.
end

# Load the defaults, used by config:migrate and by the fallback path
# that loads a legacy application.yml.  The defaults are obtained by
# asking arvados-server to dump the config of a placeholder cluster
# ("xxxxx") whose (empty) definition is passed on stdin.
defaultYAML, stderr, status = Open3.capture3("arvados-server", "config-dump", "-config=-", "-skip-legacy", stdin_data: "Clusters: {xxxxx: {}}")
if !status.success?
  # Report the child's diagnostics on stderr so they cannot get mixed
  # into anything this process writes to stdout.
  $stderr.puts stderr
  raise "error loading config: #{status}"
end
confs = YAML.load(defaultYAML, deserialize_symbols: false)
# Only the first entry under "Clusters" is used; its key is the cluster ID.
clusterID, clusterConfig = confs["Clusters"].first
$arvados_config_defaults = clusterConfig
$arvados_config_defaults["ClusterID"] = clusterID
42
# Populate $arvados_config_global, then derive the working copy from it.
if ENV["ARVADOS_CONFIG"] != "none"
  # Load the global config file by letting arvados-server dump it.
  Open3.popen2("arvados-server", "config-dump", "-skip-legacy") do |_stdin, stdout, _status_thread|
    dumped = YAML.load(stdout, deserialize_symbols: false)
    if !dumped || dumped.empty?
      # config-dump failed, assume we will be loading from legacy
      # application.yml, initialize with defaults.
      $arvados_config_global = $arvados_config_defaults.deep_dup
    else
      # config-dump merges defaults with user configuration, so every
      # key should be set.
      site_id, site_config = dumped["Clusters"].first
      $arvados_config_global = site_config
      $arvados_config_global["ClusterID"] = site_id
    end
  end
else
  # Don't load config. The magic value "none" is set by packaging
  # scripts so they can run "rake assets:precompile" without a real
  # config; the defaults stand in for the global config.
  $arvados_config_global = $arvados_config_defaults.deep_dup
end

# Work on a copy so the global config itself stays as loaded.
$arvados_config = $arvados_config_global.deep_dup
67
# Convert a legacy list-style setting into the hash form used by the
# new config: every entry becomes a string key mapped to an empty hash.
# The result is stored in +cfg+ under +k+ via ConfigLoader.set_cfg, and
# whatever set_cfg returns is returned.
#
# cfg:: config structure handed to ConfigLoader.set_cfg
# k::   destination key handed to ConfigLoader.set_cfg
# v::   list of entries; nil is treated as an empty list and a single
#       scalar as a one-element list
def arrayToHash cfg, k, v
  # Array() leaves arrays untouched, so list input behaves as before.
  val = Array(v).each_with_object({}) do |entry, acc|
    acc[entry.to_s] = {}
  end
  ConfigLoader.set_cfg cfg, k, val
end
75
# Declare all our configuration items.
#
# As used below, each declaration names a path in the new config, the
# type expected there, and optionally the legacy application.yml key it
# is migrated from plus a lambda performing a non-trivial migration.
arvcfg = ConfigLoader.new
arvcfg.declare_config("ClusterID", NonemptyString, :uuid_prefix)
arvcfg.declare_config("ManagementToken", String, :ManagementToken)
arvcfg.declare_config("SystemRootToken", String)
arvcfg.declare_config("Git.Repositories", String, :git_repositories_dir)
arvcfg.declare_config("API.DisabledAPIs", Hash, :disable_api_methods, ->(cfg, _k, v) { arrayToHash(cfg, "API.DisabledAPIs", v) })
arvcfg.declare_config("API.MaxRequestSize", Integer, :max_request_size)
arvcfg.declare_config("API.MaxIndexDatabaseRead", Integer, :max_index_database_read)
arvcfg.declare_config("API.MaxItemsPerResponse", Integer, :max_items_per_response)
arvcfg.declare_config("API.MaxTokenLifetime", ActiveSupport::Duration)
arvcfg.declare_config("API.RequestTimeout", ActiveSupport::Duration)
arvcfg.declare_config("API.AsyncPermissionsUpdateInterval", ActiveSupport::Duration, :async_permissions_update_interval)
arvcfg.declare_config("Users.AutoSetupNewUsers", Boolean, :auto_setup_new_users)
arvcfg.declare_config("Users.AutoSetupNewUsersWithVmUUID", String, :auto_setup_new_users_with_vm_uuid)
arvcfg.declare_config("Users.AutoSetupNewUsersWithRepository", Boolean, :auto_setup_new_users_with_repository)
arvcfg.declare_config("Users.AutoSetupUsernameBlacklist", Hash, :auto_setup_name_blacklist, ->(cfg, _k, v) { arrayToHash(cfg, "Users.AutoSetupUsernameBlacklist", v) })
arvcfg.declare_config("Users.NewUsersAreActive", Boolean, :new_users_are_active)
arvcfg.declare_config("Users.AutoAdminUserWithEmail", String, :auto_admin_user)
arvcfg.declare_config("Users.AutoAdminFirstUser", Boolean, :auto_admin_first_user)
arvcfg.declare_config("Users.UserProfileNotificationAddress", String, :user_profile_notification_address)
arvcfg.declare_config("Users.AdminNotifierEmailFrom", String, :admin_notifier_email_from)
arvcfg.declare_config("Users.EmailSubjectPrefix", String, :email_subject_prefix)
arvcfg.declare_config("Users.UserNotifierEmailFrom", String, :user_notifier_email_from)
arvcfg.declare_config("Users.UserNotifierEmailBcc", Hash)
arvcfg.declare_config("Users.NewUserNotificationRecipients", Hash, :new_user_notification_recipients, ->(cfg, _k, v) { arrayToHash(cfg, "Users.NewUserNotificationRecipients", v) })
# Spell out the destination path, as every other list-valued legacy key
# in this file does.  Passing method(:arrayToHash) directly would
# forward the loader's own `k` argument as the destination -- presumably
# the legacy key name rather than this path (confirm against
# ConfigLoader#migrate_config).
arvcfg.declare_config "Users.NewInactiveUserNotificationRecipients", Hash, :new_inactive_user_notification_recipients, ->(cfg, k, v) { arrayToHash cfg, "Users.NewInactiveUserNotificationRecipients", v }
# Login, TLS and audit/system log settings.
arvcfg.declare_config("Login.LoginCluster", String)
arvcfg.declare_config("Login.TrustedClients", Hash)
arvcfg.declare_config("Login.RemoteTokenRefresh", ActiveSupport::Duration)
arvcfg.declare_config("Login.TokenLifetime", ActiveSupport::Duration)
arvcfg.declare_config("TLS.Insecure", Boolean, :sso_insecure)
arvcfg.declare_config("AuditLogs.MaxAge", ActiveSupport::Duration, :max_audit_log_age)
arvcfg.declare_config("AuditLogs.MaxDeleteBatch", Integer, :max_audit_log_delete_batch)
arvcfg.declare_config("AuditLogs.UnloggedAttributes", Hash, :unlogged_attributes, ->(cfg, _k, v) { arrayToHash(cfg, "AuditLogs.UnloggedAttributes", v) })
arvcfg.declare_config("SystemLogs.MaxRequestLogParamsSize", Integer, :max_request_log_params_size)

# Collection settings.
arvcfg.declare_config("Collections.DefaultReplication", Integer, :default_collection_replication)
arvcfg.declare_config("Collections.DefaultTrashLifetime", ActiveSupport::Duration, :default_trash_lifetime)
arvcfg.declare_config("Collections.CollectionVersioning", Boolean, :collection_versioning)
arvcfg.declare_config("Collections.PreserveVersionIfIdle", ActiveSupport::Duration, :preserve_version_if_idle)
arvcfg.declare_config("Collections.TrashSweepInterval", ActiveSupport::Duration, :trash_sweep_interval)
arvcfg.declare_config("Collections.BlobSigningKey", String, :blob_signing_key)
arvcfg.declare_config("Collections.BlobSigningTTL", ActiveSupport::Duration, :blob_signature_ttl)
# The legacy flag is stored negated under the new key.
arvcfg.declare_config("Collections.BlobSigning", Boolean, :permit_create_collection_with_unsigned_manifest, ->(cfg, _k, v) { ConfigLoader.set_cfg(cfg, "Collections.BlobSigning", !v) })
arvcfg.declare_config("Collections.ForwardSlashNameSubstitution", String)

# Container settings.
arvcfg.declare_config("Containers.SupportedDockerImageFormats", Hash, :docker_image_formats, ->(cfg, _k, v) { arrayToHash(cfg, "Containers.SupportedDockerImageFormats", v) })
arvcfg.declare_config("Containers.LogReuseDecisions", Boolean, :log_reuse_decisions)
arvcfg.declare_config("Containers.DefaultKeepCacheRAM", Integer, :container_default_keep_cache_ram)
arvcfg.declare_config("Containers.MaxDispatchAttempts", Integer, :max_container_dispatch_attempts)
arvcfg.declare_config("Containers.MaxRetryAttempts", Integer, :container_count_max)
arvcfg.declare_config("Containers.UsePreemptibleInstances", Boolean, :preemptible_instances)
arvcfg.declare_config("Containers.MaxComputeVMs", Integer, :max_compute_nodes)
arvcfg.declare_config("Containers.Logging.LogBytesPerEvent", Integer, :crunch_log_bytes_per_event)
arvcfg.declare_config("Containers.Logging.LogSecondsBetweenEvents", ActiveSupport::Duration, :crunch_log_seconds_between_events)
arvcfg.declare_config("Containers.Logging.LogThrottlePeriod", ActiveSupport::Duration, :crunch_log_throttle_period)
arvcfg.declare_config("Containers.Logging.LogThrottleBytes", Integer, :crunch_log_throttle_bytes)
arvcfg.declare_config("Containers.Logging.LogThrottleLines", Integer, :crunch_log_throttle_lines)
arvcfg.declare_config("Containers.Logging.LimitLogBytesPerJob", Integer, :crunch_limit_log_bytes_per_job)
arvcfg.declare_config("Containers.Logging.LogPartialLineThrottlePeriod", ActiveSupport::Duration, :crunch_log_partial_line_throttle_period)
arvcfg.declare_config("Containers.Logging.LogUpdatePeriod", ActiveSupport::Duration, :crunch_log_update_period)
arvcfg.declare_config("Containers.Logging.LogUpdateSize", Integer, :crunch_log_update_size)
arvcfg.declare_config("Containers.Logging.MaxAge", ActiveSupport::Duration, :clean_container_log_rows_after)
arvcfg.declare_config("Containers.SLURM.Managed.DNSServerConfDir", Pathname, :dns_server_conf_dir)
arvcfg.declare_config("Containers.SLURM.Managed.DNSServerConfTemplate", Pathname, :dns_server_conf_template)
arvcfg.declare_config("Containers.SLURM.Managed.DNSServerReloadCommand", String, :dns_server_reload_command)
arvcfg.declare_config("Containers.SLURM.Managed.DNSServerUpdateCommand", String, :dns_server_update_command)
arvcfg.declare_config("Containers.SLURM.Managed.ComputeNodeDomain", String, :compute_node_domain)
arvcfg.declare_config("Containers.SLURM.Managed.ComputeNodeNameservers", Hash, :compute_node_nameservers, ->(cfg, _k, v) { arrayToHash(cfg, "Containers.SLURM.Managed.ComputeNodeNameservers", v) })
arvcfg.declare_config("Containers.SLURM.Managed.AssignNodeHostname", String, :assign_node_hostname)
# The legacy value is stored in its string form.
arvcfg.declare_config("Containers.JobsAPI.Enable", String, :enable_legacy_jobs_api, ->(cfg, _k, v) { ConfigLoader.set_cfg(cfg, "Containers.JobsAPI.Enable", v.to_s) })
arvcfg.declare_config("Containers.JobsAPI.GitInternalDir", String, :git_internal_dir)

# Mail and service URL settings.
arvcfg.declare_config("Mail.MailchimpAPIKey", String, :mailchimp_api_key)
arvcfg.declare_config("Mail.MailchimpListID", String, :mailchimp_list_id)
arvcfg.declare_config("Services.Controller.ExternalURL", URI)
arvcfg.declare_config("Services.Workbench1.ExternalURL", URI, :workbench_address)
arvcfg.declare_config("Services.Websocket.ExternalURL", URI, :websocket_address)
arvcfg.declare_config("Services.WebDAV.ExternalURL", URI, :keep_web_service_url)
arvcfg.declare_config("Services.GitHTTP.ExternalURL", URI, :git_repo_https_base)
# The legacy value gets an "ssh://" prefix to form the new value.
arvcfg.declare_config("Services.GitSSH.ExternalURL", URI, :git_repo_ssh_base, ->(cfg, _k, v) { ConfigLoader.set_cfg(cfg, "Services.GitSSH.ExternalURL", "ssh://#{v}") })

# Legacy remote_hosts maps cluster id => host.  Each id that has no
# entry yet under RemoteClusters gets one with the fixed settings
# below; entries already present are left untouched.
arvcfg.declare_config("RemoteClusters", Hash, :remote_hosts, ->(cfg, _k, v) {
  merged = cfg["RemoteClusters"] ? cfg["RemoteClusters"].deep_dup : {}
  v.each do |clusterid, host|
    next unless merged[clusterid].nil?
    merged[clusterid] = {
      "Host" => host,
      "Proxy" => true,
      "Scheme" => "https",
      "Insecure" => false,
      "ActivateUsers" => false
    }
  end
  ConfigLoader.set_cfg(cfg, "RemoteClusters", merged)
})
arvcfg.declare_config("RemoteClusters.*.Proxy", Boolean, :remote_hosts_via_dns)
arvcfg.declare_config("StorageClasses", Hash)
176
# Separate loader for database settings: it maps the keys of a legacy
# database.yml section onto the PostgreSQL part of the new config.
dbcfg = ConfigLoader.new

dbcfg.declare_config("PostgreSQL.ConnectionPool", Integer, :pool)
dbcfg.declare_config("PostgreSQL.Connection.host", String, :host)
dbcfg.declare_config("PostgreSQL.Connection.port", String, :port)
dbcfg.declare_config("PostgreSQL.Connection.user", String, :username)
dbcfg.declare_config("PostgreSQL.Connection.password", String, :password)
dbcfg.declare_config("PostgreSQL.Connection.dbname", String, :database)
dbcfg.declare_config("PostgreSQL.Connection.template", String, :template)
dbcfg.declare_config("PostgreSQL.Connection.encoding", String, :encoding)
dbcfg.declare_config("PostgreSQL.Connection.collation", String, :collation)
188
# Build the legacy application config: for application.default.yml and
# then application.yml, merge the 'common' section followed by the
# section named after the current Rails environment.
application_config = {}
["application.default", "application"].each do |cfgfile|
  loaded = ConfigLoader.load("#{::Rails.root.to_s}/config/#{cfgfile}.yml", erb: true)
  # A result of false means the YAML file was empty; skip it.
  unless loaded == false
    ['common', ::Rails.env.to_s].each do |section|
      application_config.deep_merge!(loaded[section] || {})
    end
  end
end
198
# Legacy database.yml is read only when ARVADOS_CONFIG_NOLEGACY is
# unset and the file exists; otherwise an empty config is used.
path = "#{::Rails.root.to_s}/config/database.yml"
db_config = if ENV['ARVADOS_CONFIG_NOLEGACY'] || !File.exist?(path)
              {}
            else
              ConfigLoader.load(path, erb: true)
            end

# Apply the legacy settings on top of $arvados_config.  The return value
# of the application.yml migration is kept in $remaining_config.
$remaining_config = arvcfg.migrate_config(application_config, $arvados_config)
legacy_db_section = db_config[::Rails.env.to_s] || {}
dbcfg.migrate_config(legacy_db_section, $arvados_config)
207
# Legacy auto_activate_users_from lists cluster ids; for each one that
# has an entry under RemoteClusters, switch on "ActivateUsers".
#
# $arvados_config is indexed with string keys here, like everywhere else
# in this file: it is still a plain Hash at this point (method-style
# access only becomes available once it has been copied into the Rails
# config object).
if application_config[:auto_activate_users_from]
  remote_clusters = $arvados_config["RemoteClusters"]
  application_config[:auto_activate_users_from].each do |cluster|
    remote = remote_clusters[cluster]
    # Ids without a RemoteClusters entry are ignored.
    remote["ActivateUsers"] = true if remote
  end
end
215
# Legacy host/port/scheme settings are combined into the Controller's
# ExternalURL.  The scheme defaults to "https", the port is optional,
# and a non-empty host is mandatory as soon as any of the three is set.
#
# $arvados_config is indexed with string keys here, like everywhere else
# in this file: it is still a plain Hash at this point.
if application_config[:host] || application_config[:port] || application_config[:scheme]
  if !application_config[:host] || application_config[:host].empty?
    raise "Must set 'host' when setting 'port' or 'scheme'"
  end
  scheme = application_config[:scheme] || "https"
  port_suffix = application_config[:port] ? ":#{application_config[:port]}" : ""
  $arvados_config["Services"]["Controller"]["ExternalURL"] = URI("#{scheme}://#{application_config[:host]}#{port_suffix}")
end
223
# Checks for wrongly typed configuration items, coerces properties
# into correct types (such as Duration), and optionally raises an error
# for essential configuration that can't be empty.
#
# The defaults and the global config are checked without the non-empty
# requirement; the final $arvados_config is checked with it, by both
# loaders.
[$arvados_config_defaults, $arvados_config_global].each do |reference_config|
  arvcfg.coercion_and_check reference_config, check_nonempty: false
end
[arvcfg, dbcfg].each do |loader|
  loader.coercion_and_check $arvados_config, check_nonempty: true
end

# * $arvados_config_defaults is the defaults
# * $arvados_config_global is $arvados_config_defaults merged with the contents of /etc/arvados/config.yml
# These are used by the rake config: tasks
#
# * $arvados_config is $arvados_config_global merged with the migrated contents of application.yml
# This is what actually gets copied into the Rails configuration object.
238
# Refuse to start with a default trash lifetime shorter than one day
# (86400 seconds).
#
# The message is built from the same $arvados_config value that is being
# tested: the config has not been copied into the Rails configuration
# object yet at this point, so it cannot be read from there.
trash_lifetime = $arvados_config["Collections"]["DefaultTrashLifetime"]
if trash_lifetime < 86400.seconds
  raise "default_trash_lifetime is %d, must be at least 86400" % trash_lifetime.to_i
end
242
# Derive DefaultStorageClasses: the sorted names of all storage classes
# whose "Default" entry is truthy, or just "default" when there is none.
default_storage_classes = $arvados_config["StorageClasses"].select { |_name, settings| settings["Default"] }.keys
default_storage_classes = ["default"] if default_storage_classes.empty?
$arvados_config["DefaultStorageClasses"] = default_storage_classes.sort
253
#
# Overrides that only apply in the Rails "test" environment.
#
if ::Rails.env.to_s == "test"
  test_connection = $arvados_config["PostgreSQL"]["Connection"]
  # Special case for the test database when database.yml has no "test"
  # section, because the Arvados config.yml doesn't have a concept of
  # multiple rails environments.
  test_connection["dbname"] = "arvados_test" if db_config["test"].nil?
  # Use template0 when creating a new database. Avoids
  # character-encoding/collation problems.
  test_connection["template"] = "template0"
  # Some test cases depend on en_US.UTF-8 collation.
  test_connection["collation"] = "en_US.UTF-8"
end
269
if ENV["ARVADOS_CONFIG"] == "none"
  # No real config was loaded.  We need the postgresql connection URI
  # to be valid, even if we don't use it, so fill in placeholders.
  placeholder_connection = $arvados_config["PostgreSQL"]["Connection"]
  [["host", "localhost"], ["user", "x"], ["password", "x"], ["dbname", "x"]].each do |field, value|
    placeholder_connection[field] = value
  end
end
278
# An empty database password is a fatal configuration error; the
# message includes the whole PostgreSQL section to help locate it.
pg_password = $arvados_config["PostgreSQL"]["Connection"]["password"]
raise "Database password is empty, PostgreSQL section is: #{$arvados_config["PostgreSQL"]}" if pg_password.empty?
282
pg_connection = $arvados_config["PostgreSQL"]["Connection"]

# host[:port] part of the URL.  The port is declared as a String in this
# file, so it is compared in string form: a missing, blank or "0" port
# means "no explicit port" and leaves the host without a trailing colon.
dbhost = pg_connection["host"]
dbport = pg_connection["port"].to_s
if !dbport.empty? && dbport != "0"
  dbhost += ":#{dbport}"
end

#
# If DATABASE_URL is set, then ActiveRecord won't error out if database.yml doesn't exist.
#
# For config migration, we've previously populated the PostgreSQL
# section of the config from database.yml
#
# NOTE(review): the encoding parameter is read from "client_encoding",
# while the legacy database.yml "encoding" key is migrated to
# "PostgreSQL.Connection.encoding" -- confirm that a migrated encoding
# is meant to be ignored here.
database_url = "postgresql://#{CGI.escape pg_connection["user"]}:"+
               "#{CGI.escape pg_connection["password"]}@"+
               "#{dbhost}/#{CGI.escape pg_connection["dbname"]}?"+
               "template=#{pg_connection["template"]}&"+
               "encoding=#{pg_connection["client_encoding"]}&"+
               "collation=#{pg_connection["collation"]}&"+
               "pool=#{$arvados_config["PostgreSQL"]["ConnectionPool"]}"

ENV["DATABASE_URL"] = database_url
303
Server::Application.configure do
  # Copy into the Rails config object.  This also turns Hash into
  # OrderedOptions so that application code can use
  # Rails.configuration.API.Blah instead of
  # Rails.configuration.API["Blah"]
  ConfigLoader.copy_into_config $arvados_config, config
  ConfigLoader.copy_into_config $remaining_config, config

  # We don't rely on cookies for authentication, so instead of
  # requiring a signing key in config, we assign a new random one at
  # startup.  It is drawn from SecureRandom rather than Kernel#rand so
  # the key comes from a cryptographically secure generator; the value
  # range and base-36 format are unchanged.
  secrets.secret_key_base = SecureRandom.random_number(1<<255).to_s(36)
end