X-Git-Url: https://git.arvados.org/arvados.git/blobdiff_plain/83d08d7ccbc622ec97948929c83fb91f96743ca2..6fe8e52020d421797306e5c6536afbcee761510a:/services/nodemanager/arvnodeman/computenode/dispatch/__init__.py diff --git a/services/nodemanager/arvnodeman/computenode/dispatch/__init__.py b/services/nodemanager/arvnodeman/computenode/dispatch/__init__.py index 9106ea67cc..b4fec5096d 100644 --- a/services/nodemanager/arvnodeman/computenode/dispatch/__init__.py +++ b/services/nodemanager/arvnodeman/computenode/dispatch/__init__.py @@ -130,7 +130,7 @@ class ComputeNodeSetupActor(ComputeNodeStateChangeBase): @RetryMixin._retry() def create_cloud_node(self): self._logger.info("Sending create_node request for node size %s.", - self.cloud_size.name) + self.cloud_size.id) try: self.cloud_node = self._cloud.create_node(self.cloud_size, self.arvados_node) @@ -432,6 +432,11 @@ class ComputeNodeMonitorActor(config.actor_class): reason for the decision. """ + # If this node's size is invalid (because it has a stale arvados_node_size + # tag), return True so that it's properly shut down. + if self.cloud_node.size.id == 'invalid': + return (True, "node's size tag '%s' not recognizable" % (self.cloud_node.extra['arvados_node_size'],)) + # Collect states and then consult state transition table whether we # should shut down. Possible states are: # crunch_worker_state = ['unpaired', 'busy', 'idle', 'down']