X-Git-Url: https://git.arvados.org/arvados.git/blobdiff_plain/d3229c7f727f40436cad66fba5f3345e0b3eede5..f7e3001b53e9f26fd1d413308093bb9700bb9287:/services/nodemanager/doc/ec2.example.cfg?ds=sidebyside

diff --git a/services/nodemanager/doc/ec2.example.cfg b/services/nodemanager/doc/ec2.example.cfg
index f4b27af701..024ed2b59b 100644
--- a/services/nodemanager/doc/ec2.example.cfg
+++ b/services/nodemanager/doc/ec2.example.cfg
@@ -2,6 +2,11 @@
 # All times are in seconds unless specified otherwise.
 
 [Daemon]
+# The dispatcher can customize the start and stop procedure for
+# cloud nodes. For example, the SLURM dispatcher drains nodes
+# through SLURM before shutting them down.
+#dispatcher = slurm
+
 # Node Manager will ensure that there are at least this many nodes
 # running at all times.
 min_nodes = 0
@@ -22,6 +27,12 @@ max_poll_time = 300
 # information is too outdated.
 poll_stale_after = 600
 
+# If Node Manager boots a cloud node, and it does not pair with an Arvados
+# node within this time, assume that there was a cloud bootstrap failure and
+# shut it down. Note that normal shutdown windows apply (see the Cloud
+# section), so this should be shorter than the first shutdown window value.
+boot_fail_after = 1800
+
 # "Node stale time" affects two related behaviors.
 # 1. If a compute node has been running for at least this long, but it
 # isn't paired with an Arvados node, do not shut it down, but leave it alone.