X-Git-Url: https://git.arvados.org/arvados.git/blobdiff_plain/800816a9888ac843381c08b266d607b98945cdb8..3a0aa1db801154916f50b1b299d5100945a3e1df:/services/nodemanager/arvnodeman/launcher.py diff --git a/services/nodemanager/arvnodeman/launcher.py b/services/nodemanager/arvnodeman/launcher.py index c8b3d19485..1be7e46387 100644 --- a/services/nodemanager/arvnodeman/launcher.py +++ b/services/nodemanager/arvnodeman/launcher.py @@ -12,6 +12,7 @@ import daemon import pykka from . import config as nmconfig +from .baseactor import WatchdogActor from .daemon import NodeManagerDaemonActor from .jobqueue import JobQueueMonitorActor, ServerCalculator from .nodelist import ArvadosNodeListMonitorActor, CloudNodeListMonitorActor @@ -69,14 +70,14 @@ def launch_pollers(config, server_calculator): poll_time = config.getint('Daemon', 'poll_time') max_poll_time = config.getint('Daemon', 'max_poll_time') - timer = TimedCallBackActor.start(poll_time / 10.0).proxy() + timer = TimedCallBackActor.start(poll_time / 10.0).tell_proxy() cloud_node_poller = CloudNodeListMonitorActor.start( - config.new_cloud_client(), timer, poll_time, max_poll_time).proxy() + config.new_cloud_client(), timer, poll_time, max_poll_time).tell_proxy() arvados_node_poller = ArvadosNodeListMonitorActor.start( - config.new_arvados_client(), timer, poll_time, max_poll_time).proxy() + config.new_arvados_client(), timer, poll_time, max_poll_time).tell_proxy() job_queue_poller = JobQueueMonitorActor.start( config.new_arvados_client(), timer, server_calculator, - poll_time, max_poll_time).proxy() + poll_time, max_poll_time).tell_proxy() return timer, cloud_node_poller, arvados_node_poller, job_queue_poller _caught_signals = {} @@ -110,7 +111,7 @@ def main(args=None): server_calculator = build_server_calculator(config) timer, cloud_node_poller, arvados_node_poller, job_queue_poller = \ launch_pollers(config, server_calculator) - cloud_node_updater = node_update.start(config.new_cloud_client).proxy() + cloud_node_updater = node_update.start(config.new_cloud_client).tell_proxy() node_daemon = NodeManagerDaemonActor.start( job_queue_poller, arvados_node_poller, cloud_node_poller, cloud_node_updater, timer, @@ -123,7 +124,13 @@ def main(args=None): config.getint('Daemon', 'boot_fail_after'), config.getint('Daemon', 'node_stale_after'), node_setup, node_shutdown, node_monitor, - max_total_price=config.getfloat('Daemon', 'max_total_price')).proxy() + max_total_price=config.getfloat('Daemon', 'max_total_price')).tell_proxy() + + WatchdogActor.start(config.getint('Daemon', 'watchdog'), + cloud_node_poller.actor_ref, + arvados_node_poller.actor_ref, + job_queue_poller.actor_ref, + node_daemon.actor_ref) signal.pause() daemon_stopped = node_daemon.actor_ref.actor_stopped.is_set