git.arvados.org - arvados.git/blob - lib/config/config.default.yml

2 #

3 # SPDX-License-Identifier: AGPL-3.0

4

5 # Do not use this file for site configuration. Create

6 # /etc/arvados/config.yml instead.

7 #

8 # The order of precedence (highest to lowest):

9 # 1. Legacy component-specific config files (deprecated)

10 # 2. /etc/arvados/config.yml

11 # 3. config.default.yml

12

13 Clusters:

14 xxxxx:

15 SystemRootToken: ""

16

17 # Token to be included in all healthcheck requests. Disabled by default.

18 # Server expects request header of the format "Authorization: Bearer xxx"

19 ManagementToken: ""

20

21 Services:

22

23 # In each of the service sections below, the keys under

24 # InternalURLs are the endpoints where the service should be

25 # listening, and reachable from other hosts in the cluster.

26 SAMPLE:

27 InternalURLs:

28 "http://host1.example:12345": {}

29 "http://host2.example:12345":

30 # Rendezvous is normally empty/omitted. When changing the

31 # URL of a Keepstore service, Rendezvous should be set to

32 # the old URL (with trailing slash omitted) to preserve

33 # rendezvous ordering.

34 Rendezvous: ""

35 SAMPLE:

36 Rendezvous: ""

37 ExternalURL: "-"

38

39 RailsAPI:

40 InternalURLs: {}

41 ExternalURL: "-"

42 Controller:

43 InternalURLs: {}

44 ExternalURL: ""

45 Websocket:

46 InternalURLs: {}

47 ExternalURL: ""

48 Keepbalance:

49 InternalURLs: {}

50 ExternalURL: "-"

51 GitHTTP:

52 InternalURLs: {}

53 ExternalURL: ""

54 GitSSH:

55 InternalURLs: {}

56 ExternalURL: ""

57 DispatchCloud:

58 InternalURLs: {}

59 ExternalURL: "-"

60 SSO:

61 InternalURLs: {}

62 ExternalURL: ""

63 Keepproxy:

64 InternalURLs: {}

65 ExternalURL: ""

66 WebDAV:

67 InternalURLs: {}

68 # Base URL for Workbench inline preview. If blank, use

69 # WebDAVDownload instead, and disable inline preview.

70 # If both are empty, downloading collections from workbench

71 # will be impossible.

72 #

73 # It is important to properly configure the download service

74 # to mitigate cross-site-scripting (XSS) attacks. An HTML page

75 # can be stored in a collection. If an attacker causes a victim

76 # to visit that page through Workbench, it will be rendered by

77 # the browser. If all collections are served at the same

78 # domain, the browser will consider collections as coming from

79 # the same origin and having access to the same browsing data,

80 # enabling malicious Javascript on that page to access Arvados

81 # on behalf of the victim.

82 #

83 # This is mitigated by having separate domains for each

84 # collection, or limiting preview to circumstances where the

85 # collection is not accessed with the user's regular

86 # full-access token.

87 #

88 # Serve preview links using uuid or pdh in subdomain

89 # (requires wildcard DNS and TLS certificate)

90 # https://*.collections.uuid_prefix.arvadosapi.com

91 #

92 # Serve preview links using uuid or pdh in main domain

93 # (requires wildcard DNS and TLS certificate)

94 # https://*--collections.uuid_prefix.arvadosapi.com

95 #

96 # Serve preview links by setting uuid or pdh in the path.

97 # This configuration only allows previews of public data or

98 # collection-sharing links, because these use the anonymous

99 # user token or the token is already embedded in the URL.

100 # Other data must be handled as downloads via WebDAVDownload:

101 # https://collections.uuid_prefix.arvadosapi.com

102 #

103 ExternalURL: ""

104

105 WebDAVDownload:

106 InternalURLs: {}

107 # Base URL for download links. If blank, serve links to WebDAV

108 # with disposition=attachment query param. Unlike preview links,

109 # browsers do not render attachments, so there is no risk of XSS.

110 #

111 # If WebDAVDownload is blank, and WebDAV uses a

112 # single-origin form, then Workbench will show an error page.

113 #

114 # Serve download links by setting uuid or pdh in the path:

115 # https://download.uuid_prefix.arvadosapi.com

116 #

117 ExternalURL: ""

118

119 Keepstore:

120 InternalURLs: {}

121 ExternalURL: "-"

122 Composer:

123 InternalURLs: {}

124 ExternalURL: ""

125 WebShell:

126 InternalURLs: {}

127 # ShellInABox service endpoint URL for a given VM. If empty, do not

128 # offer web shell logins.

129 #

130 # E.g., using a path-based proxy server to forward connections to shell hosts:

131 # https://webshell.uuid_prefix.arvadosapi.com

132 #

133 # E.g., using a name-based proxy server to forward connections to shell hosts:

134 # https://*.webshell.uuid_prefix.arvadosapi.com

135 ExternalURL: ""

136 Workbench1:

137 InternalURLs: {}

138 ExternalURL: ""

139 Workbench2:

140 InternalURLs: {}

141 ExternalURL: ""

142 Nodemanager:

143 InternalURLs: {}

144 ExternalURL: "-"

145 Health:

146 InternalURLs: {}

147 ExternalURL: "-"

148

149 PostgreSQL:

150 # max concurrent connections per arvados server daemon

151 ConnectionPool: 32

152 Connection:

153 # All parameters here are passed to the PG client library in a connection string;

154 # see https://www.postgresql.org/docs/current/static/libpq-connect.html#LIBPQ-PARAMKEYWORDS

155 host: ""

156 port: ""

157 user: ""

158 password: ""

159 dbname: ""

160 SAMPLE: ""

161 API:

162 # Maximum size (in bytes) allowed for a single API request. This

163 # limit is published in the discovery document for use by clients.

164 # Note: You must separately configure the upstream web server or

165 # proxy to actually enforce the desired maximum request size on the

166 # server side.

167 MaxRequestSize: 134217728

168

169 # Limit the number of bytes read from the database during an index

170 # request (by retrieving and returning fewer rows than would

171 # normally be returned in a single response).

172 # Note 1: This setting never reduces the number of returned rows to

173 # zero, no matter how big the first data row is.

174 # Note 2: Currently, this is only checked against a specific set of

175 # columns that tend to get large (collections.manifest_text,

176 # containers.mounts, workflows.definition). Other fields (e.g.,

177 # "properties" hashes) are not counted against this limit.

178 MaxIndexDatabaseRead: 134217728

179

180 # Maximum number of items to return when responding to APIs that

181 # can return partial result sets using limit and offset parameters

182 # (e.g., *.index, groups.contents). If a request specifies a "limit"

183 # parameter higher than this value, this value is used instead.

184 MaxItemsPerResponse: 1000

185

186 # Maximum number of concurrent requests to accept in a single

187 # service process, or 0 for no limit.

188 MaxConcurrentRequests: 0

189

190 # Maximum number of 64MiB memory buffers per Keepstore server process, or

191 # 0 for no limit. When this limit is reached, up to

192 # (MaxConcurrentRequests - MaxKeepBlobBuffers) HTTP requests requiring

193 # buffers (like GET and PUT) will wait for buffer space to be released.

194 # Any HTTP requests beyond MaxConcurrentRequests will receive an

195 # immediate 503 response.

196 #

197 # MaxKeepBlobBuffers should be set such that (MaxKeepBlobBuffers * 64MiB

198 # * 1.1) fits comfortably in memory. On a host dedicated to running

199 # Keepstore, divide total memory by 88MiB to suggest a suitable value.

200 # For example, if grep MemTotal /proc/meminfo reports MemTotal: 7125440

201 # kB, compute 7125440 / (88 * 1024)=79 and configure MaxKeepBlobBuffers: 79

202 MaxKeepBlobBuffers: 128

203

204 # API methods to disable. Disabled methods are not listed in the

205 # discovery document, and respond 404 to all requests.

206 # Example: {"jobs.create":{}, "pipeline_instances.create": {}}

207 DisabledAPIs: {}

208

209 # Interval (seconds) between asynchronous permission view updates. Any

210 # permission-updating API called with the 'async' parameter schedules an

211 # update on the permission view in the future, if not already scheduled.

212 AsyncPermissionsUpdateInterval: 20s

213

214 # Maximum number of concurrent outgoing requests to make while

215 # serving a single incoming multi-cluster (federated) request.

216 MaxRequestAmplification: 4

217

218 # RailsSessionSecretToken is a string of alphanumeric characters

219 # used by Rails to sign session tokens. IMPORTANT: This is a

220 # site secret. It should be at least 50 characters.

221 RailsSessionSecretToken: ""

222

223 # Maximum wall clock time to spend handling an incoming request.

224 RequestTimeout: 5m

225

226 # Websocket will send a periodic empty event after 'SendTimeout'

227 # if there is no other activity to maintain the connection /

228 # detect dropped connections.

229 SendTimeout: 60s

230

231 WebsocketClientEventQueue: 64

232 WebsocketServerEventQueue: 4

233

234 # Timeout on requests to internal Keep services.

235 KeepServiceRequestTimeout: 15s

236

237 Users:

238 # Config parameters to automatically setup new users. If enabled,

239 # these users will be able to self-activate. Enable this if you want

240 # to run an open instance where anyone can create an account and use

241 # the system without requiring manual approval.

242 #

243 # The params AutoSetupNewUsersWith* are meaningful only when AutoSetupNewUsers is turned on.

244 # AutoSetupUsernameBlacklist is a list of usernames to be blacklisted for auto setup.

245 AutoSetupNewUsers: false

246 AutoSetupNewUsersWithVmUUID: ""

247 AutoSetupNewUsersWithRepository: false

248 AutoSetupUsernameBlacklist:

249 arvados: {}

250 git: {}

251 gitolite: {}

252 gitolite-admin: {}

253 root: {}

254 syslog: {}

255 SAMPLE: {}

256

257 # When NewUsersAreActive is set to true, new users will be active

258 # immediately. This skips the "self-activate" step which enforces

259 # user agreements. Should only be enabled for development.

260 NewUsersAreActive: false

261

262 # The e-mail address of the user you would like to become marked as an admin

263 # user on their first login.

264 # In the default configuration, authentication happens through the Arvados SSO

265 # server, which uses OAuth2 against Google's servers, so in that case this

266 # should be an address associated with a Google account.

267 AutoAdminUserWithEmail: ""

268

269 # If AutoAdminFirstUser is set to true, the first user to log in when no

270 # other admin users exist will automatically become an admin user.

271 AutoAdminFirstUser: false

272

273 # Email address to notify whenever a user creates a profile for the

274 # first time

275 UserProfileNotificationAddress: ""

276 AdminNotifierEmailFrom: arvados@example.com

277 EmailSubjectPrefix: "[ARVADOS] "

278 UserNotifierEmailFrom: arvados@example.com

279 NewUserNotificationRecipients: {}

280 NewInactiveUserNotificationRecipients: {}

281

282 # Set AnonymousUserToken to enable anonymous user access. You can get

283 # the token by running "bundle exec ./script/get_anonymous_user_token.rb"

284 # in the directory where your API server is running.

285 AnonymousUserToken: ""

286

287 # If a new user has an alternate email address (local@domain)

288 # with the domain given here, its local part becomes the new

289 # user's default username. Otherwise, the user's primary email

290 # address is used.

291 PreferDomainForUsername: ""

292

293 AuditLogs:

294 # Time to keep audit logs, as a duration. (An audit log is a row added

295 # to the "logs" table in the PostgreSQL database each time an

296 # Arvados object is created, modified, or deleted.)

297 #

298 # Currently, websocket event notifications rely on audit logs, so

299 # this should not be set lower than 5m (5 minutes).

300 MaxAge: 336h

301

302 # Maximum number of log rows to delete in a single SQL transaction.

303 #

304 # If MaxDeleteBatch is 0, log entries will never be

305 # deleted by Arvados. Cleanup can be done by an external process

306 # without affecting any Arvados system processes, as long as very

307 # recent (<5 minutes old) logs are not deleted.

308 #

309 # 100000 is a reasonable batch size for most sites.

310 MaxDeleteBatch: 0

311

312 # Attributes to suppress in events and audit logs. Notably,

313 # specifying {"manifest_text": {}} here typically makes the database

314 # smaller and faster.

315 #

316 # Warning: Using any non-empty value here can have undesirable side

317 # effects for any client or component that relies on event logs.

318 # Use at your own risk.

319 UnloggedAttributes: {}

320

321 SystemLogs:

322

323 # Logging threshold: panic, fatal, error, warn, info, debug, or

324 # trace

325 LogLevel: info

326

327 # Logging format: json or text

328 Format: json

329

330 # Maximum characters of (JSON-encoded) query parameters to include

331 # in each request log entry. When params exceed this size, they will

332 # be JSON-encoded, truncated to this size, and logged as

333 # params_truncated.

334 MaxRequestLogParamsSize: 2000

335

336 Collections:

337

338 # Enable access controls for data stored in Keep. This should

339 # always be set to true on a production cluster.

340 BlobSigning: true

341

342 # BlobSigningKey is a string of alphanumeric characters used to

343 # generate permission signatures for Keep locators. It must be

344 # identical to the permission key given to Keep. IMPORTANT: This

345 # is a site secret. It should be at least 50 characters.

346 #

347 # Modifying BlobSigningKey will invalidate all existing

348 # signatures, which can cause programs to fail (e.g., arv-put,

349 # arv-get, and Crunch jobs). To avoid errors, rotate keys only

350 # when no such processes are running.

351 BlobSigningKey: ""

352

353 # Enable garbage collection of unreferenced blobs in Keep.

354 BlobTrash: true

355

356 # Time to leave unreferenced blobs in "trashed" state before

357 # deleting them, or 0 to skip the "trashed" state entirely and

358 # delete unreferenced blobs.

359 #

360 # If you use any Amazon S3 buckets as storage volumes, this

361 # must be at least 24h to avoid occasional data loss.

362 BlobTrashLifetime: 336h

363

364 # How often to check for (and delete) trashed blocks whose

365 # BlobTrashLifetime has expired.

366 BlobTrashCheckInterval: 24h

367

368 # Maximum number of concurrent "trash blob" and "delete trashed

369 # blob" operations conducted by a single keepstore process. Each

370 # of these can be set to 0 to disable the respective operation.

371 #

372 # If BlobTrashLifetime is zero, "trash" and "delete trash"

373 # happen at once, so only the lower of these two values is used.

374 BlobTrashConcurrency: 4

375 BlobDeleteConcurrency: 4

376

377 # Maximum number of concurrent "create additional replica of

378 # existing blob" operations conducted by a single keepstore

379 # process.

380 BlobReplicateConcurrency: 4

381

382 # Default replication level for collections. This is used when a

383 # collection's replication_desired attribute is nil.

384 DefaultReplication: 2

385

386 # BlobSigningTTL determines the minimum lifetime of transient

387 # data, i.e., blocks that are not referenced by

388 # collections. Unreferenced blocks exist for two reasons:

389 #

390 # 1) A data block must be written to a disk/cloud backend device

391 # before a collection can be created/updated with a reference to

392 # it.

393 #

394 # 2) Deleting or updating a collection can remove the last

395 # remaining reference to a data block.

396 #

397 # If BlobSigningTTL is too short, long-running

398 # processes/containers will fail when they take too long (a)

399 # between writing blocks and writing collections that reference

400 # them, or (b) between reading collections and reading the

401 # referenced blocks.

402 #

403 # If BlobSigningTTL is too long, data will still be stored long

404 # after the referring collections are deleted, and you will

405 # needlessly fill up disks or waste money on cloud storage.

406 #

407 # Modifying BlobSigningTTL invalidates existing signatures; see

408 # BlobSigningKey note above.

409 #

410 # The default is 2 weeks.

411 BlobSigningTTL: 336h

412

413 # When running keep-balance, this is the destination filename for

414 # the list of lost block hashes if there are any, one per line.

415 # Updated automatically during each successful run.

416 BlobMissingReport: ""

417

418 # keep-balance operates periodically, i.e.: do a

419 # scan/balance operation, sleep, repeat.

420 #

421 # BalancePeriod determines the interval between start times of

422 # successive scan/balance operations. If a scan/balance operation

423 # takes longer than BalancePeriod, the next one will follow it

424 # immediately.

425 #

426 # If SIGUSR1 is received during an idle period between operations,

427 # the next operation will start immediately.

428 BalancePeriod: 10m

429

430 # Limits the number of collections retrieved by keep-balance per

431 # API transaction. If this is zero, page size is

432 # determined by the API server's own page size limits (see

433 # API.MaxItemsPerResponse and API.MaxIndexDatabaseRead).

434 BalanceCollectionBatch: 0

435

436 # The size of keep-balance's internal queue of

437 # collections. Higher values use more memory and improve throughput

438 # by allowing keep-balance to fetch the next page of collections

439 # while the current page is still being processed. If this is zero

440 # or omitted, pages are processed serially.

441 BalanceCollectionBuffers: 1000

442

443 # Default lifetime for ephemeral collections: 2 weeks. This must not

444 # be less than BlobSigningTTL.

445 DefaultTrashLifetime: 336h

446

447 # Interval (seconds) between trash sweeps. During a trash sweep,

448 # collections are marked as trash if their trash_at time has

449 # arrived, and deleted if their delete_at time has arrived.

450 TrashSweepInterval: 60s

451

452 # If true, enable collection versioning.

453 # When a collection's preserve_version field is true or the current version

454 # is older than the amount of seconds defined on PreserveVersionIfIdle,

455 # a snapshot of the collection's previous state is created and linked to

456 # the current collection.

457 CollectionVersioning: false

458

459 # 0s = auto-create a new version on every update.

460 # -1s = never auto-create new versions.

461 # > 0s = auto-create a new version when older than the specified number of seconds.

462 PreserveVersionIfIdle: -1s

463

464 # If non-empty, allow project and collection names to contain

465 # the "/" character (slash/stroke/solidus), and replace "/" with

466 # the given string in the filesystem hierarchy presented by

467 # WebDAV. Example values are "%2f" and "{slash}". Names that

468 # contain the substitution string itself may result in confusing

469 # behavior, so a value like "_" is not recommended.

470 #

471 # If the default empty value is used, the server will reject

472 # requests to create or rename a collection when the new name

473 # contains "/".

474 #

475 # If the value "/" is used, project and collection names

476 # containing "/" will be allowed, but they will not be

477 # accessible via WebDAV.

478 #

479 # Use of this feature is not recommended, if it can be avoided.

480 ForwardSlashNameSubstitution: ""

481

482 # Managed collection properties. At creation time, if the client didn't

483 # provide the listed keys, they will be automatically populated following

484 # one of the following behaviors:

485 #

486 # * UUID of the user who owns the containing project.

487 # responsible_person_uuid: {Function: original_owner, Protected: true}

488 #

489 # * Default concrete value.

490 # foo_bar: {Value: baz, Protected: false}

491 #

492 # If Protected is true, only an admin user can modify its value.

493 ManagedProperties:

494 SAMPLE: {Function: original_owner, Protected: true}

495

496 # In "trust all content" mode, Workbench will redirect download

497 # requests to WebDAV preview link, even in the cases when

498 # WebDAV would have to expose XSS vulnerabilities in order to

499 # handle the redirect (see discussion on Services.WebDAV).

500 #

501 # This setting has no effect in the recommended configuration,

502 # where the WebDAV is configured to have a separate domain for

503 # every collection; in this case XSS protection is provided by

504 # browsers' same-origin policy.

505 #

506 # The default setting (false) is appropriate for a multi-user site.

507 TrustAllContent: false

508

509 # Cache parameters for WebDAV content serving:

510 # * TTL: Maximum time to cache manifests and permission checks.

511 # * UUIDTTL: Maximum time to cache collection state.

512 # * MaxBlockEntries: Maximum number of block cache entries.

513 # * MaxCollectionEntries: Maximum number of collection cache entries.

514 # * MaxCollectionBytes: Approximate memory limit for collection cache.

515 # * MaxPermissionEntries: Maximum number of permission cache entries.

516 # * MaxUUIDEntries: Maximum number of UUID cache entries.

517 WebDAVCache:

518 TTL: 300s

519 UUIDTTL: 5s

520 MaxBlockEntries: 4

521 MaxCollectionEntries: 1000

522 MaxCollectionBytes: 100000000

523 MaxPermissionEntries: 1000

524 MaxUUIDEntries: 1000

525

526 Login:

527 # One of the following mechanisms (SSO, Google, PAM, LDAP, or

528 # LoginCluster) should be enabled; see

529 # https://doc.arvados.org/install/setup-login.html

530

531 Google:

532 # Authenticate with Google.

533 Enable: false

534

535 # Use the Google Cloud console to enable the People API (APIs

536 # and Services > Enable APIs and services > Google People API

537 # > Enable), generate a Client ID and secret (APIs and

538 # Services > Credentials > Create credentials > OAuth client

539 # ID > Web application) and add your controller's /login URL

540 # (e.g., "https://zzzzz.example.com/login") as an authorized

541 # redirect URL.

542 #

543 # Incompatible with ForceLegacyAPI14. ProviderAppID must be

544 # blank.

545 ClientID: ""

546 ClientSecret: ""

547

548 # Allow users to log in to existing accounts using any verified

549 # email address listed by their Google account. If true, the

550 # Google People API must be enabled in order for Google login to

551 # work. If false, only the primary email address will be used.

552 AlternateEmailAddresses: true

553

554 PAM:

555 # (Experimental) Use PAM to authenticate users.

556 Enable: false

557

558 # PAM service name. PAM will apply the policy in the

559 # corresponding config file (e.g., /etc/pam.d/arvados) or, if

560 # there is none, the default "other" config.

561 Service: arvados

562

563 # Domain name (e.g., "example.com") to use to construct the

564 # user's email address if PAM authentication returns a

565 # username with no "@". If empty, use the PAM username as the

566 # user's email address, whether or not it contains "@".

567 #

568 # Note that the email address is used as the primary key for

569 # user records when logging in. Therefore, if you change

570 # DefaultEmailDomain after the initial installation, you

571 # should also update existing user records to reflect the new

572 # domain. Otherwise, next time those users log in, they will

573 # be given new accounts instead of accessing their existing

574 # accounts.

575 DefaultEmailDomain: ""

576

577 LDAP:

578 # Use an LDAP service to authenticate users.

579 Enable: false

580

581 # Server URL, like "ldap://ldapserver.example.com:389" or

582 # "ldaps://ldapserver.example.com:636".

583 URL: "ldap://ldap:389"

584

585 # Use StartTLS upon connecting to the server.

586 StartTLS: true

587

588 # Skip TLS certificate name verification.

589 InsecureTLS: false

590

591 # Strip the @domain part if a user supplies an email-style

592 # username with this domain. If "*", strip any user-provided

593 # domain. If "", never strip the domain part. Example:

594 # "example.com"

595 StripDomain: ""

596

597 # If, after applying StripDomain, the username contains no "@"

598 # character, append this domain to form an email-style

599 # username. Example: "example.com"

600 AppendDomain: ""

601

602 # The LDAP attribute to filter on when looking up a username

603 # (after applying StripDomain and AppendDomain).

604 SearchAttribute: uid

605

606 # Bind with this username (DN or UPN) and password when

607 # looking up the user record.

608 #

609 # Example user: "cn=admin,dc=example,dc=com"

610 SearchBindUser: ""

611 SearchBindPassword: ""

612

613 # Directory base for username lookup. Example:

614 # "ou=Users,dc=example,dc=com"

615 SearchBase: ""

616

617 # Additional filters for username lookup. Special characters

618 # in assertion values must be escaped (see RFC4515). Example:

619 # "(objectClass=person)"

620 SearchFilters: ""

621

622 # LDAP attribute to use as the user's email address.

623 #

624 # Important: This must not be an attribute whose value can be

625 # edited in the directory by the users themselves. Otherwise,

626 # users can take over other users' Arvados accounts trivially

627 # (email address is the primary key for Arvados accounts.)

628 EmailAttribute: mail

629

630 # LDAP attribute to use as the preferred Arvados username. If

631 # no value is found (or this config is empty) the username

632 # originally supplied by the user will be used.

633 UsernameAttribute: uid

634

635 SSO:

636 # Authenticate with a separate SSO server. (Deprecated)

637 Enable: false

638

639 # ProviderAppID and ProviderAppSecret are generated during SSO

640 # setup; see

641 # https://doc.arvados.org/v2.0/install/install-sso.html#update-config

642 ProviderAppID: ""

643 ProviderAppSecret: ""

644

645 # The cluster ID to delegate the user database. When set,

646 # logins on this cluster will be redirected to the login cluster

647 # (login cluster must appear in RemoteClusters with Proxy: true)

648 LoginCluster: ""

649

650 # How long a cached token belonging to a remote cluster will

651 # remain valid before it needs to be revalidated.

652 RemoteTokenRefresh: 5m

653

654 Git:

655 # Path to git or gitolite-shell executable. Each authenticated

656 # request will execute this program with the single argument "http-backend"

657 GitCommand: /usr/bin/git

658

659 # Path to Gitolite's home directory. If a non-empty path is given,

660 # the CGI environment will be set up to support the use of

661 # gitolite-shell as a GitCommand: for example, if GitoliteHome is

662 # "/gh", then the CGI environment will have GITOLITE_HTTP_HOME=/gh,

663 # PATH=$PATH:/gh/bin, and GL_BYPASS_ACCESS_CHECKS=1.

664 GitoliteHome: ""

665

666 # Git repositories must be readable by api server, or you won't be

667 # able to submit crunch jobs. To pass the test suites, put a clone

668 # of the arvados tree in {git_repositories_dir}/arvados.git or

669 # {git_repositories_dir}/arvados/.git

670 Repositories: /var/lib/arvados/git/repositories

671

672 TLS:

673 Certificate: ""

674 Key: ""

675 Insecure: false

676

677 Containers:

678 # List of supported Docker Registry image formats that compute nodes

679 # are able to use. `arv keep docker` will error out if a user tries

680 # to store an image with an unsupported format. Use an empty array

681 # to skip the compatibility check (and display a warning message to

682 # that effect).

683 #

684 # Example for sites running docker < 1.10: {"v1": {}}

685 # Example for sites running docker >= 1.10: {"v2": {}}

686 # Example for disabling check: {}

687 SupportedDockerImageFormats:

688 "v2": {}

689 SAMPLE: {}

690

691 # Include details about job reuse decisions in the server log. This

692 # causes additional database queries to run, so it should not be

693 # enabled unless you expect to examine the resulting logs for

694 # troubleshooting purposes.

695 LogReuseDecisions: false

696

697 # Default value for keep_cache_ram of a container's runtime_constraints.

698 DefaultKeepCacheRAM: 268435456

699

700 # Number of times a container can be unlocked before being

701 # automatically cancelled.

702 MaxDispatchAttempts: 5

703

704 # Default value for container_count_max for container requests. This is the

705 # number of times Arvados will create a new container to satisfy a container

706 # request. If a container is cancelled it will retry a new container if

707 # container_count < container_count_max on any container requests associated

708 # with the cancelled container.

709 MaxRetryAttempts: 3

710

711 # The maximum number of compute nodes that can be in use simultaneously

712 # If this limit is reduced, any existing nodes with slot number >= new limit

713 # will not be counted against the new limit. In other words, the new limit

714 # won't be strictly enforced until those nodes with higher slot numbers

715 # go down.

716 MaxComputeVMs: 64

717

718 # Preemptible instance support (e.g. AWS Spot Instances)

719 # When true, child containers will get created with the preemptible

720 # scheduling parameter set.

721 UsePreemptibleInstances: false

722

723 # PEM encoded SSH key (RSA, DSA, or ECDSA) used by the

724 # (experimental) cloud dispatcher for executing containers on

725 # worker VMs. Begins with "-----BEGIN RSA PRIVATE KEY-----\n"

726 # and ends with "\n-----END RSA PRIVATE KEY-----\n".

727 DispatchPrivateKey: ""

728

729 # Maximum time to wait for workers to come up before abandoning

730 # stale locks from a previous dispatch process.

731 StaleLockTimeout: 1m

732

733 # The crunch-run command to manage the container on a node

734 CrunchRunCommand: "crunch-run"

735

736 # Extra arguments to add to crunch-run invocation

737 # Example: ["--cgroup-parent-subsystem=memory"]

738 CrunchRunArgumentsList: []

739

740 # Extra RAM to reserve on the node, in addition to

741 # the amount specified in the container's RuntimeConstraints

742 ReserveExtraRAM: 256MiB

743

744 # Minimum time between two attempts to run the same container

745 MinRetryPeriod: 0s

746

747 Logging:

748 # When you run the db:delete_old_container_logs task, it will find

749 # containers that have been finished for at least this long,

750 # and delete their stdout, stderr, arv-mount, crunch-run, and

751 # crunchstat logs from the logs table.

752 MaxAge: 720h

753

754 # These two settings control how frequently log events are flushed to the

755 # database. Log lines are buffered until either LogBytesPerEvent

756 # has been reached or LogSecondsBetweenEvents has elapsed since

757 # the last flush.

758 LogBytesPerEvent: 4096

759 LogSecondsBetweenEvents: 5s

760

761 # The sample period for throttling logs.

762 LogThrottlePeriod: 60s

763

764 # Maximum number of bytes that job can log over LogThrottlePeriod

765 # before being silenced until the end of the period.

766 LogThrottleBytes: 65536

767

768 # Maximum number of lines that job can log over LogThrottlePeriod

769 # before being silenced until the end of the period.

770 LogThrottleLines: 1024

771

772 # Maximum bytes that may be logged by a single job. Log bytes that are

773 # silenced by throttling are not counted against this total.

774 LimitLogBytesPerJob: 67108864

775

776 LogPartialLineThrottlePeriod: 5s

777

778 # Container logs are written to Keep and saved in a

779 # collection, which is updated periodically while the

780 # container runs. This value sets the interval between

781 # collection updates.

782 LogUpdatePeriod: 30m

783

784 # The log collection is also updated when the specified amount of

785 # log data (given in bytes) is produced in less than one update

786 # period.

787 LogUpdateSize: 32MiB

788

789 SLURM:

790 PrioritySpread: 0

791 SbatchArgumentsList: []

792 SbatchEnvironmentVariables:

793 SAMPLE: ""

794 Managed:

795 # Path to dns server configuration directory

796 # (e.g. /etc/unbound.d/conf.d). If false, do not write any config

797 # files or touch restart.txt (see below).

798 DNSServerConfDir: ""

799

800 # Template file for the dns server host snippets. See

801 # unbound.template in this directory for an example. If false, do

802 # not write any config files.

803 DNSServerConfTemplate: ""

804

805 # String to write to {DNSServerConfDir}/restart.txt (with a

806 # trailing newline) after updating local data. If false, do not

807 # open or write the restart.txt file.

808 DNSServerReloadCommand: ""

809

810 # Command to run after each DNS update. Template variables will be

811 # substituted; see the "unbound" example below. If false, do not run

812 # a command.

813 DNSServerUpdateCommand: ""

814

815 ComputeNodeDomain: ""

816 ComputeNodeNameservers:

817 "192.168.1.1": {}

818 SAMPLE: {}

819

820 # Hostname to assign to a compute node when it sends a "ping" and the

821 # hostname in its Node record is nil.

822 # During bootstrapping, the "ping" script is expected to notice the

823 # hostname given in the ping response, and update its unix hostname

824 # accordingly.

825 # If false, leave the hostname alone (this is appropriate if your compute

826 # nodes' hostnames are already assigned by some other mechanism).

827 #

828 # One way or another, the hostnames of your node records should agree

829 # with your DNS records and your /etc/slurm-llnl/slurm.conf files.

830 #

831 # Example for compute0000, compute0001, ....:

832 # AssignNodeHostname: compute%<slot_number>04d

833 # (See http://ruby-doc.org/core-2.2.2/Kernel.html#method-i-format for more.)

834 AssignNodeHostname: "compute%<slot_number>d"

835

836 JobsAPI:

837 # Enable the legacy 'jobs' API (crunch v1). This value must be a string.

838 #

839 # Note: this only enables read-only access, creating new

840 # legacy jobs and pipelines is not supported.

841 #

842 # 'auto' -- (default) enable the Jobs API only if it has been used before

843 # (i.e., there are job records in the database)

844 # 'true' -- enable the Jobs API despite lack of existing records.

845 # 'false' -- disable the Jobs API despite presence of existing records.

846 Enable: 'auto'

847

848 # Git repositories must be readable by api server, or you won't be

849 # able to submit crunch jobs. To pass the test suites, put a clone

850 # of the arvados tree in {git_repositories_dir}/arvados.git or

851 # {git_repositories_dir}/arvados/.git

852 GitInternalDir: /var/lib/arvados/internal.git

853

854 CloudVMs:

855 # Enable the cloud scheduler (experimental).

856 Enable: false

857

858 # Name/number of port where workers' SSH services listen.

859 SSHPort: "22"

860

861 # Interval between queue polls.

862 PollInterval: 10s

863

864 # Shell command to execute on each worker to determine whether

865 # the worker is booted and ready to run containers. It should

866 # exit zero if the worker is ready.

867 BootProbeCommand: "docker ps -q"

868

869 # Minimum interval between consecutive probes to a single

870 # worker.

871 ProbeInterval: 10s

872

873 # Maximum probes per second, across all workers in a pool.

874 MaxProbesPerSecond: 10

875

876 # Time before repeating SIGTERM when killing a container.

877 TimeoutSignal: 5s

878

879 # Time to give up on SIGTERM and write off the worker.

880 TimeoutTERM: 2m

881

882 # Maximum create/destroy-instance operations per second (0 =

883 # unlimited).

884 MaxCloudOpsPerSecond: 0

885

886 # Interval between cloud provider syncs/updates ("list all

887 # instances").

888 SyncInterval: 1m

889

890 # Time to leave an idle worker running (in case new containers

891 # appear in the queue that it can run) before shutting it

892 # down.

893 TimeoutIdle: 1m

894

895 # Time to wait for a new worker to boot (i.e., pass

896 # BootProbeCommand) before giving up and shutting it down.

897 TimeoutBooting: 10m

898

899 # Maximum time a worker can stay alive with no successful

900 # probes before being automatically shut down.

901 TimeoutProbe: 10m

902

903 # Time after shutting down a worker to retry the

904 # shutdown/destroy operation.

905 TimeoutShutdown: 10s

906

907 # Worker VM image ID.

908 ImageID: ""

909

910 # An executable file (located on the dispatcher host) to be

911 # copied to cloud instances at runtime and used as the

912 # container runner/supervisor. The default value is the

913 # dispatcher program itself.

914 #

915 # Use the empty string to disable this step: nothing will be

916 # copied, and cloud instances are assumed to have a suitable

917 # version of crunch-run installed.

918 DeployRunnerBinary: "/proc/self/exe"

919

920 # Tags to add on all resources (VMs, NICs, disks) created by

921 # the container dispatcher. (Arvados's own tags --

922 # InstanceType, IdleBehavior, and InstanceSecret -- will also

923 # be added.)

924 ResourceTags:

925 SAMPLE: "tag value"

926

927 # Prefix for predefined tags used by Arvados (InstanceSetID,

928 # InstanceType, InstanceSecret, IdleBehavior). With the

929 # default value "Arvados", tags are "ArvadosInstanceSetID",

930 # "ArvadosInstanceSecret", etc.

931 #

932 # This should only be changed while no cloud resources are in

933 # use and the cloud dispatcher is not running. Otherwise,

934 # VMs/resources that were added using the old tag prefix will

935 # need to be detected and cleaned up manually.

936 TagKeyPrefix: Arvados

937

938 # Cloud driver: "azure" (Microsoft Azure) or "ec2" (Amazon AWS).

939 Driver: ec2

940

941 # Cloud-specific driver parameters.

942 DriverParameters:

943

944 # (ec2) Credentials.

945 AccessKeyID: ""

946 SecretAccessKey: ""

947

948 # (ec2) Instance configuration.

949 SecurityGroupIDs:

950 "SAMPLE": {}

951 SubnetID: ""

952 Region: ""

953 EBSVolumeType: gp2

954 AdminUsername: debian

955

956 # (azure) Credentials.

957 SubscriptionID: ""

958 ClientID: ""

959 ClientSecret: ""

960 TenantID: ""

961

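962 # (azure) Instance configuration. NOTE(review): AdminUsername is also listed in the (ec2) section above; if both are in the same mapping this is a duplicate key -- confirm which value the loader keeps.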

963 CloudEnvironment: AzurePublicCloud

964 ResourceGroup: ""

965 Location: centralus

966 Network: ""

967 Subnet: ""

968 StorageAccount: ""

969 BlobContainer: ""

970 DeleteDanglingResourcesAfter: 20s

971 AdminUsername: arvados

972

973 InstanceTypes:

974

975 # Use the instance type name as the key (in place of "SAMPLE" in

976 # this sample entry).

977 SAMPLE:

978 # Cloud provider's instance type. Defaults to the configured type name.

979 ProviderType: ""

980 VCPUs: 1

981 RAM: 128MiB

982 IncludedScratch: 16GB

983 AddedScratch: 0

984 Price: 0.1

985 Preemptible: false

986

987 Volumes:

988 SAMPLE:

989 # AccessViaHosts specifies which keepstore processes can read

990 # and write data on the volume.

991 #

992 # For a local filesystem, AccessViaHosts has one entry,

993 # indicating which server the filesystem is located on.

994 #

995 # For a network-attached backend accessible by all keepstore

996 # servers, like a cloud storage bucket or an NFS mount,

997 # AccessViaHosts can be empty/omitted.

998 #

999 # Further info/examples:

1000 # https://doc.arvados.org/install/configure-fs-storage.html

1001 # https://doc.arvados.org/install/configure-s3-object-storage.html

1002 # https://doc.arvados.org/install/configure-azure-blob-storage.html

1003 AccessViaHosts:

1004 SAMPLE:

1005 ReadOnly: false

1006 "http://host1.example:25107": {}

1007 ReadOnly: false

1008 Replication: 1

1009 StorageClasses:

1010 default: true

1011 SAMPLE: true

1012 Driver: s3

1013 DriverParameters:

1014 # for s3 driver -- see

1015 # https://doc.arvados.org/install/configure-s3-object-storage.html

1016 IAMRole: aaaaa

1017 AccessKey: aaaaa

1018 SecretKey: aaaaa

1019 Endpoint: ""

1020 Region: us-east-1a

1021 Bucket: aaaaa

1022 LocationConstraint: false

1023 IndexPageSize: 1000

1024 ConnectTimeout: 1m

1025 ReadTimeout: 10m

1026 RaceWindow: 24h

1027

1028 # For S3 driver, potentially unsafe tuning parameter,

1029 # intentionally excluded from main documentation.

1030 #

1031 # Enable deletion (garbage collection) even when the

1032 # configured BlobTrashLifetime is zero. WARNING: eventual

1033 # consistency may result in race conditions that can cause

1034 # data loss. Do not enable this unless you understand and

1035 # accept the risk.

1036 UnsafeDelete: false

1037

1038 # for azure driver -- see

1039 # https://doc.arvados.org/install/configure-azure-blob-storage.html

1040 StorageAccountName: aaaaa

1041 StorageAccountKey: aaaaa

1042 StorageBaseURL: core.windows.net

1043 ContainerName: aaaaa

1044 RequestTimeout: 30s

1045 ListBlobsRetryDelay: 10s

1046 ListBlobsMaxAttempts: 10

1047 MaxGetBytes: 0

1048 WriteRaceInterval: 15s

1049 WriteRacePollTime: 1s

1050

1051 # for local directory driver -- see

1052 # https://doc.arvados.org/install/configure-fs-storage.html

1053 Root: /var/lib/arvados/keep-data

1054

1055 # For local directory driver, potentially confusing tuning

1056 # parameter, intentionally excluded from main documentation.

1057 #

1058 # When true, read and write operations (for whole 64MiB

1059 # blocks) on an individual volume will be queued and issued

1060 # serially. When false, read and write operations will be

1061 # issued concurrently.

1062 #

1063 # May possibly improve throughput if you have physical spinning disks

1064 # and experience contention when there are multiple requests

1065 # to the same volume.

1066 #

1067 # Otherwise, when using SSDs, RAID, or a shared network filesystem, you

1068 # should leave this alone.

1069 Serialize: false

1070

1071 Mail:

1072 MailchimpAPIKey: ""

1073 MailchimpListID: ""

1074 SendUserSetupNotificationEmail: true

1075

1076 # Bug/issue report notification to and from addresses

1077 IssueReporterEmailFrom: "arvados@example.com"

1078 IssueReporterEmailTo: "arvados@example.com"

1079 SupportEmailAddress: "arvados@example.com"

1080

1081 # Generic issue email from

1082 EmailFrom: "arvados@example.com"

1083 RemoteClusters:

1084 "*":

1085 Host: ""

1086 Proxy: false

1087 Scheme: https

1088 Insecure: false

1089 ActivateUsers: false

1090 SAMPLE:

1091 # API endpoint host or host:port; default is {id}.arvadosapi.com

1092 Host: sample.arvadosapi.com

1093

1094 # Perform a proxy request when a local client requests an

1095 # object belonging to this remote.

1096 Proxy: false

1097

1098 # Default "https". Can be set to "http" for testing.

1099 Scheme: https

1100

1101 # Disable TLS verify. Can be set to true for testing.

1102 Insecure: false

1103

1104 # When users present tokens issued by this remote cluster, and

1105 # their accounts are active on the remote cluster, activate

1106 # them on this cluster too.

1107 ActivateUsers: false

1108

1109 Workbench:

1110 # Workbench1 configs

1111 Theme: default

1112 ActivationContactLink: mailto:info@arvados.org

1113 ArvadosDocsite: https://doc.arvados.org

1114 ArvadosPublicDataDocURL: https://playground.arvados.org/projects/public

1115 ShowUserAgreementInline: false

1116 SecretKeyBase: ""

1117

1118 # Scratch directory used by the remote repository browsing

1119 # feature. If it doesn't exist, it (and any missing parents) will be

1120 # created using mkdir_p.

1121 RepositoryCache: /var/www/arvados-workbench/current/tmp/git

1122

1123 # Below is a sample setting of the UserProfileFormFields config parameter.

1124 # This configuration parameter should be set to either false (to disable) or

1125 # to a map as shown below.

1126 # Configure the map of input fields to be displayed in the profile page

1127 # using the attribute "key" for each of the input fields.

1128 # This sample shows configuration with one required and one optional form field.

1129 # For each of these input fields:

1130 # You can specify "Type" as "text" or "select".

1131 # List the "Options" to be displayed for each "select" menu.

1132 # Set "Required" as "true" for any of these fields to make them required.

1133 # If any of the required fields are missing in the user's profile, the user will be

1134 # redirected to the profile page before they can access any Workbench features.

1135 UserProfileFormFields:

1136 SAMPLE:

1137 Type: select

1138 FormFieldTitle: Best color

1139 FormFieldDescription: your favorite color

1140 Required: false

1141 Position: 1

1142 Options:

1143 red: {}

1144 blue: {}

1145 green: {}

1146 SAMPLE: {}

1147

1148 # exampleTextValue: # key that will be set in properties

1149 # Type: text #

1150 # FormFieldTitle: ""

1151 # FormFieldDescription: ""

1152 # Required: true

1153 # Position: 1

1154 # exampleOptionsValue:

1155 # Type: select

1156 # FormFieldTitle: ""

1157 # FormFieldDescription: ""

1158 # Required: true

1159 # Position: 1

1160 # Options:

1161 # red: {}

1162 # blue: {}

1163 # yellow: {}

1164

1165 # Use "UserProfileFormMessage" to configure the message you want

1166 # to display on the profile page.

1167 UserProfileFormMessage: 'Welcome to Arvados. All <span style="color:red">required fields</span> must be completed before you can proceed.'

1168

1169 # Mimetypes of applications for which the view icon

1170 # would be enabled in a collection's show page.

1171 # It is sufficient to list only applications here.

1172 # No need to list text and image types.

1173 ApplicationMimetypesWithViewIcon:

1174 cwl: {}

1175 fasta: {}

1176 go: {}

1177 javascript: {}

1178 json: {}

1179 pdf: {}

1180 python: {}

1181 x-python: {}

1182 r: {}

1183 rtf: {}

1184 sam: {}

1185 x-sh: {}

1186 vnd.realvnc.bed: {}

1187 xml: {}

1188 xsl: {}

1189 SAMPLE: {}

1190

1191 # The maximum number of bytes to load in the log viewer

1192 LogViewerMaxBytes: 1M

1193

1194 # When anonymous_user_token is configured, show public projects page

1195 EnablePublicProjectsPage: true

1196

1197 # By default, disable the "Getting Started" popup which is specific to Arvados playground

1198 EnableGettingStartedPopup: false

1199

1200 # Ask Arvados API server to compress its response payloads.

1201 APIResponseCompression: true

1202

1203 # Timeouts for API requests.

1204 APIClientConnectTimeout: 2m

1205 APIClientReceiveTimeout: 5m

1206

1207 # Maximum number of historic log records of a running job to fetch

1208 # and display in the Log tab, while subscribing to web sockets.

1209 RunningJobLogRecordsToFetch: 2000

1210

1211 # In systems with many shared projects, loading of dashboard and topnav

1212 # can be slow due to collections indexing; use the following parameters

1213 # to suppress these properties

1214 ShowRecentCollectionsOnDashboard: true

1215 ShowUserNotifications: true

1216

1217 # Enable/disable "multi-site search" in top nav ("true"/"false"), or

1218 # a link to the multi-site search page on a "home" Workbench site.

1219 #

1220 # Example:

1221 # https://workbench.qr1hi.arvadosapi.com/collections/multisite

1222 MultiSiteSearch: ""

1223

1224 # Should workbench allow management of local git repositories? Set to false if

1225 # the jobs api is disabled and there are no local git repositories.

1226 Repositories: true

1227

1228 SiteName: Arvados Workbench

1229 ProfilingEnabled: false

1230

1231 # This is related to obsolete Google OpenID 1.0 login

1232 # but some workbench stuff still expects it to be set.

1233 DefaultOpenIdPrefix: "https://www.google.com/accounts/o8/id"

1234

1235 # Workbench2 configs

1236 VocabularyURL: ""

1237 FileViewersConfigURL: ""

1238

1239 # Workbench welcome screen, this is HTML text that will be

1240 # incorporated directly onto the page.

1241 WelcomePageHTML: |

1242 <img src="/arvados-logo-big.png" style="width: 20%; float: right; padding: 1em;" />

1243 <h2>Please log in.</h2>

1244

1245 <p>The "Log in" button below will show you a sign-in

1246 page. After you log in, you will be redirected back to

1247 Arvados Workbench.</p>

1248

1249 <p>If you have never used Arvados Workbench before, logging in

1250 for the first time will automatically create a new

1251 account.</p>

1252

1253 <i>Arvados Workbench uses your name and email address only for

1254 identification, and does not retrieve any other personal

1255 information.</i>

1256

1257 # Workbench screen displayed to inactive users. This is HTML

1258 # text that will be incorporated directly onto the page.

1259 InactivePageHTML: |

1260 <img src="/arvados-logo-big.png" style="width: 20%; float: right; padding: 1em;" />

1261 <h3>Hi! You're logged in, but...</h3>

1262 <p>Your account is inactive.</p>

1263 <p>An administrator must activate your account before you can get

1264 any further.</p>

1265

1266 # Connecting to Arvados shell VMs tends to be site-specific.

1267 # Put any special instructions here. This is HTML text that will

1268 # be incorporated directly onto the Workbench page.

1269 SSHHelpPageHTML: |

1270 <a href="https://doc.arvados.org/user/getting_started/ssh-access-unix.html">Accessing an Arvados VM with SSH</a> (generic instructions).

1271 Site configurations vary. Contact your local cluster administrator if you have difficulty accessing an Arvados shell node.

1272

1273 # Sample text if you are using a "switchyard" ssh proxy.

1274 # Replace "zzzzz" with your Cluster ID.

1275 #SSHHelpPageHTML: |

1276 # <p>Add a section like this to your SSH configuration file ( <i>~/.ssh/config</i>):</p>

1277 # <pre>Host *.zzzzz

1278 # TCPKeepAlive yes

1279 # ServerAliveInterval 60

1280 # ProxyCommand ssh -p2222 turnout@switchyard.zzzzz.arvadosapi.com -x -a $SSH_PROXY_FLAGS %h

1281 # </pre>

1282

1283 # If you are using a switchyard ssh proxy, shell node hostnames

1284 # may require a special hostname suffix. In the sample ssh

1285 # configuration above, this would be ".zzzzz"

1286 # This is added to the hostname in the "command line" column

1287 # of the Workbench "shell VMs" page.

1288 #

1289 # If your shell nodes are directly accessible by users without a

1290 # proxy and have fully qualified host names, you should leave

1291 # this blank.

1292 SSHHelpHostSuffix: ""

1293

1294 # Bypass new (Arvados 1.5) API implementations, and hand off

1295 # requests directly to Rails instead. This can provide a temporary

1296 # workaround for clients that are incompatible with the new API

1297 # implementation. Note that it also disables some new federation

1298 # features and will be removed in a future release.

1299 ForceLegacyAPI14: false

1300

1301 # (Experimental) Restart services automatically when config file

1302 # changes are detected. Only supported by `arvados-server boot` in

1303 # dev/test mode.

1304 AutoReloadConfig: false