Merge branch '21290-sync-past-versions' refs #21290
[arvados.git] / services / api / config / arvados_config.rb
1 # Copyright (C) The Arvados Authors. All rights reserved.
2 #
3 # SPDX-License-Identifier: AGPL-3.0
4
5 #
6 # Load Arvados configuration from /etc/arvados/config.yml, using defaults
7 # from config.default.yml
8 #
9 # Existing application.yml is migrated into the new config structure.
10 # Keys in the legacy application.yml take precedence.
11 #
# Use "bundle exec rake config:dump" to get the complete active configuration
#
# Use "bundle exec rake config:migrate" to migrate application.yml and
# database.yml to config.yml.  After adding the output of
# config:migrate to /etc/arvados/config.yml, you will be able to
# delete application.yml and database.yml.
18
require "cgi"
require 'config_loader'
require 'open3'
require 'securerandom'
22
begin
  # If secret_token.rb exists here, we need to load it first.
  require_relative 'secret_token.rb'
rescue LoadError
  # Normally secret_token.rb is missing and the secret token is
  # configured by application.yml (i.e., here!) instead.
end

# Load the defaults, used by config:migrate and fallback loading
# legacy application.yml.
#
# The defaults are obtained by running "arvados-server config-dump"
# against a minimal config, supplied on stdin, that contains only an
# empty placeholder cluster named "xxxxx".
load_time = Time.now.utc
defaultYAML, stderr, status = Open3.capture3("arvados-server", "config-dump", "-config=-", "-skip-legacy", stdin_data: "Clusters: {xxxxx: {}}")
if !status.success?
  # Report the subprocess diagnostics on stderr (not stdout) so they
  # cannot get mixed into output that a caller may be capturing.
  $stderr.puts stderr
  raise "error loading config: #{status}"
end
confs = YAML.safe_load(defaultYAML)
# Only the first cluster in the dump is used.
clusterID, clusterConfig = confs["Clusters"].first
$arvados_config_defaults = clusterConfig
$arvados_config_defaults["ClusterID"] = clusterID
# SourceTimestamp and SourceSHA256 are top-level keys of the dump and
# are copied into the per-cluster hash.
$arvados_config_defaults["SourceTimestamp"] = Time.rfc3339(confs["SourceTimestamp"])
$arvados_config_defaults["SourceSHA256"] = confs["SourceSHA256"]
45
# Populate $arvados_config_global, then derive the working copy
# $arvados_config from it.
if ENV["ARVADOS_CONFIG"] != "none"
  # Load the global config file
  Open3.popen2("arvados-server", "config-dump", "-skip-legacy") do |_stdin, stdout, _status_thread|
    dumped = YAML.safe_load(stdout)
    if !dumped || dumped.empty?
      # config-dump failed, assume we will be loading from legacy
      # application.yml, initialize with defaults.
      $arvados_config_global = $arvados_config_defaults.deep_dup
    else
      # config-dump merges defaults with user configuration, so every
      # key should be set.  Only the first cluster is used.
      cluster_id, cluster_cfg = dumped["Clusters"].first
      $arvados_config_global = cluster_cfg
      cluster_cfg["ClusterID"] = cluster_id
      cluster_cfg["SourceTimestamp"] = Time.rfc3339(dumped["SourceTimestamp"])
      cluster_cfg["SourceSHA256"] = dumped["SourceSHA256"]
    end
  end
else
  # Don't load config. This magic value is set by packaging scripts so
  # they can run "rake assets:precompile" without a real config.
  $arvados_config_global = $arvados_config_defaults.deep_dup
end

# The working copy starts as a deep copy of the global config, stamped
# with the time this file started loading.
$arvados_config = $arvados_config_global.deep_dup.tap do |working|
  working["LoadTimestamp"] = load_time
end
73
# Migration helper: turns the list +v+ into a hash whose keys are the
# stringified entries of +v+ and whose values are (distinct) empty
# hashes, then stores that hash in +cfg+ under +k+ by way of
# ConfigLoader.set_cfg.
#
# Returns whatever ConfigLoader.set_cfg returns.
def arrayToHash cfg, k, v
  as_keys = v.each_with_object({}) { |item, acc| acc[item.to_s] = {} }
  ConfigLoader.set_cfg(cfg, k, as_keys)
end
81
# Declare all our configuration items.
#
# Each declaration names a config path and its expected type; where
# present, the third argument is the legacy application.yml key and
# the fourth is a callback that performs the migration.
# NOTE(review): argument meanings are inferred from usage in this
# file -- confirm against ConfigLoader#declare_config.
arvcfg = ConfigLoader.new
arvcfg.declare_config("ClusterID", NonemptyString, :uuid_prefix)
arvcfg.declare_config("ManagementToken", String, :ManagementToken)
arvcfg.declare_config("SystemRootToken", String)
arvcfg.declare_config("Git.Repositories", String, :git_repositories_dir)
arvcfg.declare_config("API.DisabledAPIs", Hash, :disable_api_methods,
                      ->(cfg, _k, v) { arrayToHash(cfg, "API.DisabledAPIs", v) })
arvcfg.declare_config("API.MaxRequestSize", Integer, :max_request_size)
arvcfg.declare_config("API.MaxIndexDatabaseRead", Integer, :max_index_database_read)
arvcfg.declare_config("API.MaxItemsPerResponse", Integer, :max_items_per_response)
arvcfg.declare_config("API.MaxTokenLifetime", ActiveSupport::Duration)
arvcfg.declare_config("API.RequestTimeout", ActiveSupport::Duration)
arvcfg.declare_config("API.AsyncPermissionsUpdateInterval", ActiveSupport::Duration, :async_permissions_update_interval)
# Users.* settings and the legacy application.yml keys they migrate from.
arvcfg.declare_config "Users.AutoSetupNewUsers", Boolean, :auto_setup_new_users
arvcfg.declare_config "Users.AutoSetupNewUsersWithVmUUID", String, :auto_setup_new_users_with_vm_uuid
arvcfg.declare_config "Users.AutoSetupNewUsersWithRepository", Boolean, :auto_setup_new_users_with_repository
arvcfg.declare_config "Users.AutoSetupUsernameBlacklist", Hash, :auto_setup_name_blacklist, ->(cfg, k, v) { arrayToHash cfg, "Users.AutoSetupUsernameBlacklist", v }
arvcfg.declare_config "Users.NewUsersAreActive", Boolean, :new_users_are_active
arvcfg.declare_config "Users.AutoAdminUserWithEmail", String, :auto_admin_user
arvcfg.declare_config "Users.AutoAdminFirstUser", Boolean, :auto_admin_first_user
arvcfg.declare_config "Users.UserProfileNotificationAddress", String, :user_profile_notification_address
arvcfg.declare_config "Users.AdminNotifierEmailFrom", String, :admin_notifier_email_from
arvcfg.declare_config "Users.EmailSubjectPrefix", String, :email_subject_prefix
arvcfg.declare_config "Users.UserNotifierEmailFrom", String, :user_notifier_email_from
arvcfg.declare_config "Users.UserNotifierEmailBcc", Hash
arvcfg.declare_config "Users.NewUserNotificationRecipients", Hash, :new_user_notification_recipients, ->(cfg, k, v) { arrayToHash cfg, "Users.NewUserNotificationRecipients", v }
# The destination path is passed explicitly, like every other
# array-to-hash migration in this file, instead of forwarding the
# callback's own key argument.
# NOTE(review): `k` is presumably the legacy key rather than the new
# config path -- confirm against ConfigLoader#migrate_config.
arvcfg.declare_config "Users.NewInactiveUserNotificationRecipients", Hash, :new_inactive_user_notification_recipients, ->(cfg, k, v) { arrayToHash cfg, "Users.NewInactiveUserNotificationRecipients", v }
arvcfg.declare_config "Users.CanCreateRoleGroups", Boolean
arvcfg.declare_config "Users.RoleGroupsVisibleToAll", Boolean
# Login, TLS, audit/system log and Collections settings.
arvcfg.declare_config("Login.LoginCluster", String)
arvcfg.declare_config("Login.TrustedClients", Hash)
arvcfg.declare_config("Login.RemoteTokenRefresh", ActiveSupport::Duration)
arvcfg.declare_config("Login.TokenLifetime", ActiveSupport::Duration)
arvcfg.declare_config("TLS.Insecure", Boolean, :sso_insecure)
arvcfg.declare_config("AuditLogs.MaxAge", ActiveSupport::Duration, :max_audit_log_age)
arvcfg.declare_config("AuditLogs.MaxDeleteBatch", Integer, :max_audit_log_delete_batch)
arvcfg.declare_config("AuditLogs.UnloggedAttributes", Hash, :unlogged_attributes,
                      ->(cfg, _k, v) { arrayToHash(cfg, "AuditLogs.UnloggedAttributes", v) })
arvcfg.declare_config("SystemLogs.MaxRequestLogParamsSize", Integer, :max_request_log_params_size)
arvcfg.declare_config("Collections.DefaultReplication", Integer, :default_collection_replication)
arvcfg.declare_config("Collections.DefaultTrashLifetime", ActiveSupport::Duration, :default_trash_lifetime)
arvcfg.declare_config("Collections.CollectionVersioning", Boolean, :collection_versioning)
arvcfg.declare_config("Collections.PreserveVersionIfIdle", ActiveSupport::Duration, :preserve_version_if_idle)
arvcfg.declare_config("Collections.TrashSweepInterval", ActiveSupport::Duration, :trash_sweep_interval)
arvcfg.declare_config("Collections.BlobSigningKey", String, :blob_signing_key)
arvcfg.declare_config("Collections.BlobSigningTTL", ActiveSupport::Duration, :blob_signature_ttl)
# The legacy flag has the opposite sense, so its value is negated
# when it is migrated.
arvcfg.declare_config("Collections.BlobSigning", Boolean, :permit_create_collection_with_unsigned_manifest,
                      ->(cfg, _k, v) { ConfigLoader.set_cfg(cfg, "Collections.BlobSigning", !v) })
arvcfg.declare_config("Collections.ForwardSlashNameSubstitution", String)
# Containers, Mail and Services settings.
arvcfg.declare_config("Containers.SupportedDockerImageFormats", Hash, :docker_image_formats,
                      ->(cfg, _k, v) { arrayToHash(cfg, "Containers.SupportedDockerImageFormats", v) })
arvcfg.declare_config("Containers.LogReuseDecisions", Boolean, :log_reuse_decisions)
arvcfg.declare_config("Containers.DefaultKeepCacheRAM", Integer, :container_default_keep_cache_ram)
arvcfg.declare_config("Containers.MaxDispatchAttempts", Integer, :max_container_dispatch_attempts)
arvcfg.declare_config("Containers.MaxRetryAttempts", Integer, :container_count_max)
arvcfg.declare_config("Containers.AlwaysUsePreemptibleInstances", Boolean, :preemptible_instances)
arvcfg.declare_config("Containers.Logging.LogBytesPerEvent", Integer, :crunch_log_bytes_per_event)
arvcfg.declare_config("Containers.Logging.LogSecondsBetweenEvents", ActiveSupport::Duration, :crunch_log_seconds_between_events)
arvcfg.declare_config("Containers.Logging.LogThrottlePeriod", ActiveSupport::Duration, :crunch_log_throttle_period)
arvcfg.declare_config("Containers.Logging.LogThrottleBytes", Integer, :crunch_log_throttle_bytes)
arvcfg.declare_config("Containers.Logging.LogThrottleLines", Integer, :crunch_log_throttle_lines)
arvcfg.declare_config("Containers.Logging.LimitLogBytesPerJob", Integer, :crunch_limit_log_bytes_per_job)
arvcfg.declare_config("Containers.Logging.LogPartialLineThrottlePeriod", ActiveSupport::Duration, :crunch_log_partial_line_throttle_period)
arvcfg.declare_config("Containers.Logging.LogUpdatePeriod", ActiveSupport::Duration, :crunch_log_update_period)
arvcfg.declare_config("Containers.Logging.LogUpdateSize", Integer, :crunch_log_update_size)
arvcfg.declare_config("Containers.Logging.MaxAge", ActiveSupport::Duration, :clean_container_log_rows_after)
arvcfg.declare_config("Containers.SLURM.Managed.DNSServerConfDir", Pathname, :dns_server_conf_dir)
arvcfg.declare_config("Containers.SLURM.Managed.DNSServerConfTemplate", Pathname, :dns_server_conf_template)
arvcfg.declare_config("Containers.SLURM.Managed.DNSServerReloadCommand", String, :dns_server_reload_command)
arvcfg.declare_config("Containers.SLURM.Managed.DNSServerUpdateCommand", String, :dns_server_update_command)
arvcfg.declare_config("Containers.SLURM.Managed.ComputeNodeDomain", String, :compute_node_domain)
arvcfg.declare_config("Containers.SLURM.Managed.ComputeNodeNameservers", Hash, :compute_node_nameservers,
                      ->(cfg, _k, v) { arrayToHash(cfg, "Containers.SLURM.Managed.ComputeNodeNameservers", v) })
arvcfg.declare_config("Containers.SLURM.Managed.AssignNodeHostname", String, :assign_node_hostname)
# The legacy value is stored in its string form.
arvcfg.declare_config("Containers.JobsAPI.Enable", String, :enable_legacy_jobs_api,
                      ->(cfg, _k, v) { ConfigLoader.set_cfg(cfg, "Containers.JobsAPI.Enable", v.to_s) })
arvcfg.declare_config("Containers.JobsAPI.GitInternalDir", String, :git_internal_dir)
arvcfg.declare_config("Mail.MailchimpAPIKey", String, :mailchimp_api_key)
arvcfg.declare_config("Mail.MailchimpListID", String, :mailchimp_list_id)
arvcfg.declare_config("Services.Controller.ExternalURL", URI)
arvcfg.declare_config("Services.Workbench1.ExternalURL", URI, :workbench_address)
arvcfg.declare_config("Services.Websocket.ExternalURL", URI, :websocket_address)
arvcfg.declare_config("Services.WebDAV.ExternalURL", URI, :keep_web_service_url)
arvcfg.declare_config("Services.GitHTTP.ExternalURL", URI, :git_repo_https_base)
# The legacy value is prefixed with "ssh://" when migrated.
arvcfg.declare_config("Services.GitSSH.ExternalURL", URI, :git_repo_ssh_base,
                      ->(cfg, _k, v) { ConfigLoader.set_cfg(cfg, "Services.GitSSH.ExternalURL", "ssh://#{v}") })
# Legacy remote_hosts maps cluster id => host.  Each one that is not
# already present under RemoteClusters is added with the fixed
# attributes below; existing entries are left untouched.
arvcfg.declare_config("RemoteClusters", Hash, :remote_hosts, lambda { |cfg, _k, v|
  merged = cfg["RemoteClusters"] ? cfg["RemoteClusters"].deep_dup : {}
  v.each do |clusterid, host|
    next unless merged[clusterid].nil?
    merged[clusterid] = {
      "Host" => host,
      "Proxy" => true,
      "Scheme" => "https",
      "Insecure" => false,
      "ActivateUsers" => false
    }
  end
  ConfigLoader.set_cfg(cfg, "RemoteClusters", merged)
})
arvcfg.declare_config("RemoteClusters.*.Proxy", Boolean, :remote_hosts_via_dns)
arvcfg.declare_config("StorageClasses", Hash)
183
# Separate loader for the database settings, which are migrated from
# the legacy database.yml rather than application.yml.
dbcfg = ConfigLoader.new

dbcfg.declare_config("PostgreSQL.ConnectionPool", Integer, :pool)

# [config path, legacy database.yml key] -- all declared as String.
[
  ["PostgreSQL.Connection.host", :host],
  ["PostgreSQL.Connection.port", :port],
  ["PostgreSQL.Connection.user", :username],
  ["PostgreSQL.Connection.password", :password],
  ["PostgreSQL.Connection.dbname", :database],
  ["PostgreSQL.Connection.template", :template],
  ["PostgreSQL.Connection.encoding", :encoding],
  ["PostgreSQL.Connection.collation", :collation],
].each do |config_path, legacy_key|
  dbcfg.declare_config(config_path, String, legacy_key)
end
195
# Build the legacy application config: application.default.yml first,
# then application.yml on top.  Within each file the 'common' section
# is merged before the section for the current Rails environment.
application_config = {}
["application.default", "application"].each do |basename|
  loaded = ConfigLoader.load("#{::Rails.root.to_s}/config/#{basename}.yml", erb: true)
  # Ignore empty YAML file:
  next if loaded.nil?
  ['common', ::Rails.env.to_s].each do |section|
    application_config.deep_merge!(loaded[section] || {})
  end
end
205
# Load the legacy database.yml, unless ARVADOS_CONFIG_NOLEGACY is set
# or the file does not exist.
db_config = {}
path = "#{::Rails.root.to_s}/config/database.yml"
if !ENV['ARVADOS_CONFIG_NOLEGACY'] && File.exist?(path)
  # ConfigLoader.load returns nil for an empty YAML file; fall back to
  # an empty hash so the lookups by environment name keep working.
  db_config = ConfigLoader.load(path, erb: true) || {}
end

# Apply the legacy settings on top of $arvados_config.  The value
# returned by the application.yml migration is kept in
# $remaining_config and later copied into the Rails config as well.
$remaining_config = arvcfg.migrate_config(application_config, $arvados_config)
dbcfg.migrate_config(db_config[::Rails.env.to_s] || {}, $arvados_config)
214
# Legacy auto_activate_users_from lists cluster ids; mark each one that
# is a known remote cluster as activating its users.
#
# $arvados_config is a plain Hash at this point, so it is indexed with
# [] like everywhere else in this file; method-style access is only
# available on the Rails config object after copy_into_config.
if application_config[:auto_activate_users_from]
  application_config[:auto_activate_users_from].each do |cluster|
    remote = $arvados_config["RemoteClusters"][cluster]
    remote["ActivateUsers"] = true if remote
  end
end
222
# Legacy host/port/scheme settings are combined into the Controller's
# ExternalURL.  'host' is mandatory once any of the three is given;
# scheme defaults to "https" and the port is optional.
if application_config[:host] || application_config[:port] || application_config[:scheme]
  if !application_config[:host] || application_config[:host].empty?
    raise "Must set 'host' when setting 'port' or 'scheme'"
  end
  legacy_scheme = application_config[:scheme] || "https"
  legacy_port = application_config[:port] ? ":#{application_config[:port]}" : ""
  # $arvados_config is a plain Hash here, so index it with [] rather
  # than calling .Services on it.
  $arvados_config["Services"]["Controller"]["ExternalURL"] =
    URI("#{legacy_scheme}://#{application_config[:host]}#{legacy_port}")
end
230
# Checks for wrongly typed configuration items, coerces properties
# into correct types (such as Duration), and optionally raise error
# for essential configuration that can't be empty.
#
# The defaults and the global config are coerced without the
# non-empty check; only the final working config must pass it.
[$arvados_config_defaults, $arvados_config_global].each do |reference_config|
  arvcfg.coercion_and_check(reference_config, check_nonempty: false)
end
[arvcfg, dbcfg].each do |loader|
  loader.coercion_and_check($arvados_config, check_nonempty: true)
end
238
239 # * $arvados_config_defaults is the defaults
240 # * $arvados_config_global is $arvados_config_defaults merged with the contents of /etc/arvados/config.yml
241 # These are used by the rake config: tasks
242 #
243 # * $arvados_config is $arvados_config_global merged with the migrated contents of application.yml
244 # This is what actually gets copied into the Rails configuration object.
245
# Refuse to start with a default trash lifetime shorter than one day.
# The message reads the value from $arvados_config: Rails.configuration
# is not populated from it until the Server::Application.configure
# block at the end of this file, so reading it here would fail before
# the intended error could be raised.
if $arvados_config["Collections"]["DefaultTrashLifetime"] < 86400.seconds then
  raise "default_trash_lifetime is %d, must be at least 86400" % $arvados_config["Collections"]["DefaultTrashLifetime"].to_i
end
249
# Collect the names of all storage classes whose "Default" entry is
# truthy; when there are none, fall back to the single class
# "default".  The sorted list is stored as DefaultStorageClasses.
default_storage_classes = $arvados_config["StorageClasses"].select { |_name, attrs| attrs["Default"] }.keys
default_storage_classes = ["default"] if default_storage_classes.empty?
$arvados_config["DefaultStorageClasses"] = default_storage_classes.sort
260
#
# Overrides that apply only in the "test" Rails environment.
#
if ::Rails.env.to_s == "test"
  test_conn = $arvados_config["PostgreSQL"]["Connection"]
  # Special case for test database where there's no database.yml,
  # because the Arvados config.yml doesn't have a concept of multiple
  # rails environments.
  test_conn["dbname"] = "arvados_test" if db_config["test"].nil?
  # Use template0 when creating a new database. Avoids
  # character-encoding/collation problems.
  test_conn["template"] = "template0"
  # Some test cases depend on en_US.UTF-8 collation.
  test_conn["collation"] = "en_US.UTF-8"
end
276
# With ARVADOS_CONFIG=none no real config is loaded, so fill in
# placeholder connection settings.
if ENV["ARVADOS_CONFIG"] == "none"
  # We need the postgresql connection URI to be valid, even if we
  # don't use it.
  $arvados_config["PostgreSQL"]["Connection"].update(
    "host" => "localhost",
    "user" => "x",
    "password" => "x",
    "dbname" => "x"
  )
end
285
# A database password is mandatory; abort, showing the PostgreSQL
# section of the config, when it is empty.
pg_section = $arvados_config["PostgreSQL"]
if pg_section["Connection"]["password"].empty?
  raise "Database password is empty, PostgreSQL section is: #{pg_section}"
end
289
# host[:port] part of the database URL.  The port is declared as a
# String in this file, so a comparison with the Integer 0 is true for
# any string; the port is therefore normalized with to_s and only
# appended when it is neither empty nor zero, which avoids producing
# "host:" with nothing after the colon.
dbhost = $arvados_config["PostgreSQL"]["Connection"]["host"]
dbport = $arvados_config["PostgreSQL"]["Connection"]["port"].to_s
unless dbport.empty? || dbport == "0"
  dbhost += ":#{dbport}"
end
294
#
# If DATABASE_URL is set, then ActiveRecord won't error out if database.yml doesn't exist.
#
# For config migration, we've previously populated the PostgreSQL
# section of the config from database.yml
#
# User, password and database name are CGI-escaped; the query
# parameters are interpolated as-is.
# NOTE(review): the URL reads Connection["client_encoding"], while the
# setting declared for migration in this file is
# "PostgreSQL.Connection.encoding" -- confirm which key is intended.
pg_settings = $arvados_config["PostgreSQL"]
pg_conn = pg_settings["Connection"]
url_credentials = "#{CGI.escape pg_conn["user"]}:#{CGI.escape pg_conn["password"]}"
url_query = [
  "template=#{pg_conn["template"]}",
  "encoding=#{pg_conn["client_encoding"]}",
  "collation=#{pg_conn["collation"]}",
  "pool=#{pg_settings["ConnectionPool"]}",
].join("&")
database_url = "postgresql://#{url_credentials}@#{dbhost}/#{CGI.escape pg_conn["dbname"]}?#{url_query}"

ENV["DATABASE_URL"] = database_url
310
Server::Application.configure do
  # Copy into the Rails config object.  This also turns Hash into
  # OrderedOptions so that application code can use
  # Rails.configuration.API.Blah instead of
  # Rails.configuration.API["Blah"]
  ConfigLoader.copy_into_config $arvados_config, config
  ConfigLoader.copy_into_config $remaining_config, config

  # We don't rely on cookies for authentication, so instead of
  # requiring a signing key in config, we assign a new random one at
  # startup.  It is still a secret, so it is drawn from SecureRandom
  # rather than Kernel#rand, which is not intended for security use.
  secrets.secret_key_base = SecureRandom.random_number(1 << 255).to_s(36)
end