git.arvados.org - arvados.git/blob - lib/config/config.default.yml

2 #

3 # SPDX-License-Identifier: AGPL-3.0

4

5 # Do not use this file for site configuration. Create

6 # /etc/arvados/config.yml instead.

7 #

8 # The order of precedence (highest to lowest):

9 # 1. Legacy component-specific config files (deprecated)

10 # 2. /etc/arvados/config.yml

11 # 3. config.default.yml

12

13 Clusters:

14 xxxxx:

15 SystemRootToken: ""

16

17 # Token to be included in all healthcheck requests. Disabled by default.

18 # Server expects request header of the format "Authorization: Bearer xxx"

19 ManagementToken: ""

20

21 Services:

22 RailsAPI:

23 InternalURLs: {}

24 GitHTTP:

25 InternalURLs: {}

26 ExternalURL: ""

27 Keepstore:

28 InternalURLs: {}

29 Controller:

30 InternalURLs: {}

31 ExternalURL: ""

32 Websocket:

33 InternalURLs: {}

34 ExternalURL: ""

35 Keepbalance:

36 InternalURLs: {}

37 GitHTTP:

38 InternalURLs: {}

39 ExternalURL: ""

40 GitSSH:

41 ExternalURL: ""

42 DispatchCloud:

43 InternalURLs: {}

44 SSO:

45 ExternalURL: ""

46 Keepproxy:

47 InternalURLs: {}

48 ExternalURL: ""

49 WebDAV:

50 InternalURLs: {}

51 ExternalURL: ""

52 WebDAVDownload:

53 InternalURLs: {}

54 ExternalURL: ""

55 Keepstore:

56 InternalURLs: {}

57 Composer:

58 ExternalURL: ""

59 WebShell:

60 ExternalURL: ""

61 Workbench1:

62 InternalURLs: {}

63 ExternalURL: ""

64 Workbench2:

65 ExternalURL: ""

66 PostgreSQL:

67 # max concurrent connections per arvados server daemon

68 ConnectionPool: 32

69 Connection:

70 # All parameters here are passed to the PG client library in a connection string;

71 # see https://www.postgresql.org/docs/current/static/libpq-connect.html#LIBPQ-PARAMKEYWORDS

72 host: ""

73 port: ""

74 user: ""

75 password: ""

76 dbname: ""

77 API:

78 # Maximum size (in bytes) allowed for a single API request. This

79 # limit is published in the discovery document for use by clients.

80 # Note: You must separately configure the upstream web server or

81 # proxy to actually enforce the desired maximum request size on the

82 # server side.

83 MaxRequestSize: 134217728

84

85 # Limit the number of bytes read from the database during an index

86 # request (by retrieving and returning fewer rows than would

87 # normally be returned in a single response).

88 # Note 1: This setting never reduces the number of returned rows to

89 # zero, no matter how big the first data row is.

90 # Note 2: Currently, this is only checked against a specific set of

91 # columns that tend to get large (collections.manifest_text,

92 # containers.mounts, workflows.definition). Other fields (e.g.,

93 # "properties" hashes) are not counted against this limit.

94 MaxIndexDatabaseRead: 134217728

95

96 # Maximum number of items to return when responding to a APIs that

97 # can return partial result sets using limit and offset parameters

98 # (e.g., *.index, groups.contents). If a request specifies a "limit"

99 # parameter higher than this value, this value is used instead.

100 MaxItemsPerResponse: 1000

101

102 # API methods to disable. Disabled methods are not listed in the

103 # discovery document, and respond 404 to all requests.

104 # Example: ["jobs.create", "pipeline_instances.create"]

105 DisabledAPIs: []

106

107 # Interval (seconds) between asynchronous permission view updates. Any

108 # permission-updating API called with the 'async' parameter schedules a an

109 # update on the permission view in the future, if not already scheduled.

110 AsyncPermissionsUpdateInterval: 20

111

112 # Maximum number of concurrent outgoing requests to make while

113 # serving a single incoming multi-cluster (federated) request.

114 MaxRequestAmplification: 4

115

116 # RailsSessionSecretToken is a string of alphanumeric characters

117 # used by Rails to sign session tokens. IMPORTANT: This is a

118 # site secret. It should be at least 50 characters.

119 RailsSessionSecretToken: ""

120

121 Users:

122 # Config parameters to automatically setup new users. If enabled,

123 # this users will be able to self-activate. Enable this if you want

124 # to run an open instance where anyone can create an account and use

125 # the system without requiring manual approval.

126 #

127 # The params auto_setup_new_users_with_* are meaningful only when auto_setup_new_users is turned on.

128 # auto_setup_name_blacklist is a list of usernames to be blacklisted for auto setup.

129 AutoSetupNewUsers: false

130 AutoSetupNewUsersWithVmUUID: ""

131 AutoSetupNewUsersWithRepository: false

132 AutoSetupUsernameBlacklist: [arvados, git, gitolite, gitolite-admin, root, syslog]

133

134 # When new_users_are_active is set to true, new users will be active

135 # immediately. This skips the "self-activate" step which enforces

136 # user agreements. Should only be enabled for development.

137 NewUsersAreActive: false

138

139 # The e-mail address of the user you would like to become marked as an admin

140 # user on their first login.

141 # In the default configuration, authentication happens through the Arvados SSO

142 # server, which uses OAuth2 against Google's servers, so in that case this

143 # should be an address associated with a Google account.

144 AutoAdminUserWithEmail: ""

145

146 # If auto_admin_first_user is set to true, the first user to log in when no

147 # other admin users exist will automatically become an admin user.

148 AutoAdminFirstUser: false

149

150 # Email address to notify whenever a user creates a profile for the

151 # first time

152 UserProfileNotificationAddress: ""

153 AdminNotifierEmailFrom: arvados@example.com

154 EmailSubjectPrefix: "[ARVADOS] "

155 UserNotifierEmailFrom: arvados@example.com

156 NewUserNotificationRecipients: []

157 NewInactiveUserNotificationRecipients: []

158

159 AuditLogs:

160 # Time to keep audit logs, in seconds. (An audit log is a row added

161 # to the "logs" table in the PostgreSQL database each time an

162 # Arvados object is created, modified, or deleted.)

163 #

164 # Currently, websocket event notifications rely on audit logs, so

165 # this should not be set lower than 300 (5 minutes).

166 MaxAge: 336h

167

168 # Maximum number of log rows to delete in a single SQL transaction.

169 #

170 # If max_audit_log_delete_batch is 0, log entries will never be

171 # deleted by Arvados. Cleanup can be done by an external process

172 # without affecting any Arvados system processes, as long as very

173 # recent (<5 minutes old) logs are not deleted.

174 #

175 # 100000 is a reasonable batch size for most sites.

176 MaxDeleteBatch: 0

177

178 # Attributes to suppress in events and audit logs. Notably,

179 # specifying ["manifest_text"] here typically makes the database

180 # smaller and faster.

181 #

182 # Warning: Using any non-empty value here can have undesirable side

183 # effects for any client or component that relies on event logs.

184 # Use at your own risk.

185 UnloggedAttributes: []

186

187 SystemLogs:

188 # Maximum characters of (JSON-encoded) query parameters to include

189 # in each request log entry. When params exceed this size, they will

190 # be JSON-encoded, truncated to this size, and logged as

191 # params_truncated.

192 MaxRequestLogParamsSize: 2000

193

194 Collections:

195 # Allow clients to create collections by providing a manifest with

196 # unsigned data blob locators. IMPORTANT: This effectively disables

197 # access controls for data stored in Keep: a client who knows a hash

198 # can write a manifest that references the hash, pass it to

199 # collections.create (which will create a permission link), use

200 # collections.get to obtain a signature for that data locator, and

201 # use that signed locator to retrieve the data from Keep. Therefore,

202 # do not turn this on if your users expect to keep data private from

203 # one another!

204 BlobSigning: true

205

206 # blob_signing_key is a string of alphanumeric characters used to

207 # generate permission signatures for Keep locators. It must be

208 # identical to the permission key given to Keep. IMPORTANT: This is

209 # a site secret. It should be at least 50 characters.

210 #

211 # Modifying blob_signing_key will invalidate all existing

212 # signatures, which can cause programs to fail (e.g., arv-put,

213 # arv-get, and Crunch jobs). To avoid errors, rotate keys only when

214 # no such processes are running.

215 BlobSigningKey: ""

216

217 # Default replication level for collections. This is used when a

218 # collection's replication_desired attribute is nil.

219 DefaultReplication: 2

220

221 # Lifetime (in seconds) of blob permission signatures generated by

222 # the API server. This determines how long a client can take (after

223 # retrieving a collection record) to retrieve the collection data

224 # from Keep. If the client needs more time than that (assuming the

225 # collection still has the same content and the relevant user/token

226 # still has permission) the client can retrieve the collection again

227 # to get fresh signatures.

228 #

229 # This must be exactly equal to the -blob-signature-ttl flag used by

230 # keepstore servers. Otherwise, reading data blocks and saving

231 # collections will fail with HTTP 403 permission errors.

232 #

233 # Modifying blob_signature_ttl invalidates existing signatures; see

234 # blob_signing_key note above.

235 #

236 # The default is 2 weeks.

237 BlobSigningTTL: 336h

238

239 # Default lifetime for ephemeral collections: 2 weeks. This must not

240 # be less than blob_signature_ttl.

241 DefaultTrashLifetime: 336h

242

243 # Interval (seconds) between trash sweeps. During a trash sweep,

244 # collections are marked as trash if their trash_at time has

245 # arrived, and deleted if their delete_at time has arrived.

246 TrashSweepInterval: 60

247

248 # If true, enable collection versioning.

249 # When a collection's preserve_version field is true or the current version

250 # is older than the amount of seconds defined on preserve_version_if_idle,

251 # a snapshot of the collection's previous state is created and linked to

252 # the current collection.

253 CollectionVersioning: false

254

255 # 0 = auto-create a new version on every update.

256 # -1 = never auto-create new versions.

257 # > 0 = auto-create a new version when older than the specified number of seconds.

258 PreserveVersionIfIdle: -1

259

260 Login:

261 # These settings are provided by your OAuth2 provider (e.g.,

262 # sso-provider).

263 ProviderAppSecret: ""

264 ProviderAppID: ""

265

266 Git:

267 # Git repositories must be readable by api server, or you won't be

268 # able to submit crunch jobs. To pass the test suites, put a clone

269 # of the arvados tree in {git_repositories_dir}/arvados.git or

270 # {git_repositories_dir}/arvados/.git

271 Repositories: /var/lib/arvados/git/repositories

272

273 TLS:

274 Insecure: false

275

276 Containers:

277 # List of supported Docker Registry image formats that compute nodes

278 # are able to use. `arv keep docker` will error out if a user tries

279 # to store an image with an unsupported format. Use an empty array

280 # to skip the compatibility check (and display a warning message to

281 # that effect).

282 #

283 # Example for sites running docker < 1.10: ["v1"]

284 # Example for sites running docker >= 1.10: ["v2"]

285 # Example for disabling check: []

286 SupportedDockerImageFormats: ["v2"]

287

288 # Include details about job reuse decisions in the server log. This

289 # causes additional database queries to run, so it should not be

290 # enabled unless you expect to examine the resulting logs for

291 # troubleshooting purposes.

292 LogReuseDecisions: false

293

294 # Default value for keep_cache_ram of a container's runtime_constraints.

295 DefaultKeepCacheRAM: 268435456

296

297 # Number of times a container can be unlocked before being

298 # automatically cancelled.

299 MaxDispatchAttempts: 5

300

301 # Default value for container_count_max for container requests. This is the

302 # number of times Arvados will create a new container to satisfy a container

303 # request. If a container is cancelled it will retry a new container if

304 # container_count < container_count_max on any container requests associated

305 # with the cancelled container.

306 MaxRetryAttempts: 3

307

308 # The maximum number of compute nodes that can be in use simultaneously

309 # If this limit is reduced, any existing nodes with slot number >= new limit

310 # will not be counted against the new limit. In other words, the new limit

311 # won't be strictly enforced until those nodes with higher slot numbers

312 # go down.

313 MaxComputeVMs: 64

314

315 # Preemptible instance support (e.g. AWS Spot Instances)

316 # When true, child containers will get created with the preemptible

317 # scheduling parameter parameter set.

318 UsePreemptibleInstances: false

319

320 # Include details about job reuse decisions in the server log. This

321 # causes additional database queries to run, so it should not be

322 # enabled unless you expect to examine the resulting logs for

323 # troubleshooting purposes.

324 LogReuseDecisions: false

325

326 Logging:

327 # When you run the db:delete_old_container_logs task, it will find

328 # containers that have been finished for at least this many seconds,

329 # and delete their stdout, stderr, arv-mount, crunch-run, and

330 # crunchstat logs from the logs table.

331 MaxAge: 720h

332

333 # These two settings control how frequently log events are flushed to the

334 # database. Log lines are buffered until either crunch_log_bytes_per_event

335 # has been reached or crunch_log_seconds_between_events has elapsed since

336 # the last flush.

337 LogBytesPerEvent: 4096

338 LogSecondsBetweenEvents: 1

339

340 # The sample period for throttling logs, in seconds.

341 LogThrottlePeriod: 60

342

343 # Maximum number of bytes that job can log over crunch_log_throttle_period

344 # before being silenced until the end of the period.

345 LogThrottleBytes: 65536

346

347 # Maximum number of lines that job can log over crunch_log_throttle_period

348 # before being silenced until the end of the period.

349 LogThrottleLines: 1024

350

351 # Maximum bytes that may be logged by a single job. Log bytes that are

352 # silenced by throttling are not counted against this total.

353 LimitLogBytesPerJob: 67108864

354

355 LogPartialLineThrottlePeriod: 5

356

357 # Container logs are written to Keep and saved in a collection,

358 # which is updated periodically while the container runs. This

359 # value sets the interval (given in seconds) between collection

360 # updates.

361 LogUpdatePeriod: 1800

362

363 # The log collection is also updated when the specified amount of

364 # log data (given in bytes) is produced in less than one update

365 # period.

366 LogUpdateSize: 33554432

367

368 SLURM:

369 Managed:

370 # Path to dns server configuration directory

371 # (e.g. /etc/unbound.d/conf.d). If false, do not write any config

372 # files or touch restart.txt (see below).

373 DNSServerConfDir: ""

374

375 # Template file for the dns server host snippets. See

376 # unbound.template in this directory for an example. If false, do

377 # not write any config files.

378 DNSServerConfTemplate: ""

379

380 # String to write to {dns_server_conf_dir}/restart.txt (with a

381 # trailing newline) after updating local data. If false, do not

382 # open or write the restart.txt file.

383 DNSServerReloadCommand: ""

384

385 # Command to run after each DNS update. Template variables will be

386 # substituted; see the "unbound" example below. If false, do not run

387 # a command.

388 DNSServerUpdateCommand: ""

389

390 ComputeNodeDomain: ""

391 ComputeNodeNameservers:

392 - 192.168.1.1

393

394 # Hostname to assign to a compute node when it sends a "ping" and the

395 # hostname in its Node record is nil.

396 # During bootstrapping, the "ping" script is expected to notice the

397 # hostname given in the ping response, and update its unix hostname

398 # accordingly.

399 # If false, leave the hostname alone (this is appropriate if your compute

400 # nodes' hostnames are already assigned by some other mechanism).

401 #

402 # One way or another, the hostnames of your node records should agree

403 # with your DNS records and your /etc/slurm-llnl/slurm.conf files.

404 #

405 # Example for compute0000, compute0001, ....:

406 # assign_node_hostname: compute%<slot_number>04d

407 # (See http://ruby-doc.org/core-2.2.2/Kernel.html#method-i-format for more.)

408 AssignNodeHostname: "compute%<slot_number>d"

409

410 JobsAPI:

411 # Enable the legacy Jobs API. This value must be a string.

412 # 'auto' -- (default) enable the Jobs API only if it has been used before

413 # (i.e., there are job records in the database)

414 # 'true' -- enable the Jobs API despite lack of existing records.

415 # 'false' -- disable the Jobs API despite presence of existing records.

416 Enable: 'auto'

417

418 # Git repositories must be readable by api server, or you won't be

419 # able to submit crunch jobs. To pass the test suites, put a clone

420 # of the arvados tree in {git_repositories_dir}/arvados.git or

421 # {git_repositories_dir}/arvados/.git

422 GitInternalDir: /var/lib/arvados/internal.git

423

424 # Docker image to be used when none found in runtime_constraints of a job

425 DefaultDockerImage: ""

426

427 # none or slurm_immediate

428 CrunchJobWrapper: none

429

430 # username, or false = do not set uid when running jobs.

431 CrunchJobUser: crunch

432

433 # The web service must be able to create/write this file, and

434 # crunch-job must be able to stat() it.

435 CrunchRefreshTrigger: /tmp/crunch_refresh_trigger

436

437 # Control job reuse behavior when two completed jobs match the

438 # search criteria and have different outputs.

439 #

440 # If true, in case of a conflict, reuse the earliest job (this is

441 # similar to container reuse behavior).

442 #

443 # If false, in case of a conflict, do not reuse any completed job,

444 # but do reuse an already-running job if available (this is the

445 # original job reuse behavior, and is still the default).

446 ReuseJobIfOutputsDiffer: false

447

448 Mail:

449 MailchimpAPIKey: ""

450 MailchimpListID: ""

451 SendUserSetupNotificationEmail: ""

452 IssueReporterEmailFrom: ""

453 IssueReporterEmailTo: ""

454 SupportEmailAddress: ""

455 EmailFrom: ""

456 RemoteClusters:

457 "*":

458 Proxy: false

459 ActivateUsers: false