Merge "Avoid handling a deploy failure twice"

This commit is contained in:
Zuul 2021-11-09 15:12:52 +00:00 committed by Gerrit Code Review
commit 188a3bbfc4
3 changed files with 57 additions and 28 deletions

View File

@ -265,6 +265,16 @@ def do_next_deploy_step(task, step_index):
{'step': step, 'node': node.uuid}) {'step': step, 'node': node.uuid})
try: try:
result = interface.execute_deploy_step(task, step) result = interface.execute_deploy_step(task, step)
except exception.AgentInProgress as e:
LOG.info('Conductor attempted to process deploy step for '
'node %(node)s. Agent indicated it is presently '
'executing a command. Error: %(error)s',
{'node': task.node.uuid,
'error': e})
driver_internal_info['skip_current_deploy_step'] = False
node.driver_internal_info = driver_internal_info
task.process_event('wait')
return
except exception.IronicException as e: except exception.IronicException as e:
if isinstance(e, exception.AgentConnectionFailed): if isinstance(e, exception.AgentConnectionFailed):
if task.node.driver_internal_info.get('deployment_reboot'): if task.node.driver_internal_info.get('deployment_reboot'):
@ -276,23 +286,17 @@ def do_next_deploy_step(task, step_index):
node.driver_internal_info = driver_internal_info node.driver_internal_info = driver_internal_info
task.process_event('wait') task.process_event('wait')
return return
if isinstance(e, exception.AgentInProgress):
LOG.info('Conductor attempted to process deploy step for ' # Avoid double handling of failures. For example, set_failed_state
'node %(node)s. Agent indicated it is presently ' # from deploy_utils already calls deploying_error_handler.
'executing a command. Error: %(error)s', if task.node.provision_state != states.DEPLOYFAIL:
{'node': task.node.uuid, log_msg = ('Node %(node)s failed deploy step %(step)s. Error: '
'error': e}) '%(err)s' % {'node': node.uuid,
driver_internal_info['skip_current_deploy_step'] = False 'step': node.deploy_step, 'err': e})
node.driver_internal_info = driver_internal_info utils.deploying_error_handler(
task.process_event('wait') task, log_msg,
return _("Deploy step %(step)s failed: %(err)s.")
log_msg = ('Node %(node)s failed deploy step %(step)s. Error: ' % {'step': conductor_steps.step_id(step), 'err': e})
'%(err)s' %
{'node': node.uuid, 'step': node.deploy_step, 'err': e})
utils.deploying_error_handler(
task, log_msg,
_("Deploy step %(step)s failed: %(err)s.")
% {'step': conductor_steps.step_id(step), 'err': e})
return return
except Exception as e: except Exception as e:
log_msg = ('Node %(node)s failed deploy step %(step)s with ' log_msg = ('Node %(node)s failed deploy step %(step)s with '
@ -300,7 +304,10 @@ def do_next_deploy_step(task, step_index):
{'node': node.uuid, 'step': node.deploy_step, 'err': e}) {'node': node.uuid, 'step': node.deploy_step, 'err': e})
utils.deploying_error_handler( utils.deploying_error_handler(
task, log_msg, task, log_msg,
_("Failed to deploy. Exception: %s") % e, traceback=True) _("Deploy step %(step)s failed with %(exc)s: %(err)s.")
% {'step': conductor_steps.step_id(step), 'err': e,
'exc': e.__class__.__name__},
traceback=True)
return return
if task.node.provision_state == states.DEPLOYFAIL: if task.node.provision_state == states.DEPLOYFAIL:

View File

@ -292,6 +292,15 @@ def log_and_raise_deployment_error(task, msg, collect_logs=True, exc=None):
""" """
log_traceback = (exc is not None log_traceback = (exc is not None
and not isinstance(exc, exception.IronicException)) and not isinstance(exc, exception.IronicException))
# Replicate the logic in do_next_deploy_step to prepend the current step
step_id = (conductor_steps.step_id(task.node.deploy_step)
if task.node.deploy_step else None)
if step_id and step_id not in msg:
msg = _("Deploy step %(step)s failed: %(err)s") % {
'step': step_id, 'err': msg
}
LOG.error(msg, exc_info=log_traceback) LOG.error(msg, exc_info=log_traceback)
deploy_utils.set_failed_state(task, msg, collect_logs=collect_logs) deploy_utils.set_failed_state(task, msg, collect_logs=collect_logs)
raise exception.InstanceDeployFailure(msg) raise exception.InstanceDeployFailure(msg)

View File

@ -111,9 +111,9 @@ class DoNodeDeployTestCase(mgr_utils.ServiceSetUpMixin, db_base.DbTestCase):
self.assertEqual(states.ACTIVE, node.target_provision_state) self.assertEqual(states.ACTIVE, node.target_provision_state)
self.assertIsNotNone(node.last_error) self.assertIsNotNone(node.last_error)
if unexpected: if unexpected:
self.assertIn('Exception', node.last_error) self.assertIn(exc.__class__.__name__, node.last_error)
else: else:
self.assertNotIn('Exception', node.last_error) self.assertNotIn(exc.__class__.__name__, node.last_error)
mock_deploy.assert_called_once_with(mock.ANY, task) mock_deploy.assert_called_once_with(mock.ANY, task)
@ -636,20 +636,23 @@ class DoNextDeployStepTestCase(mgr_utils.ServiceSetUpMixin,
@mock.patch.object(conductor_utils, 'LOG', autospec=True) @mock.patch.object(conductor_utils, 'LOG', autospec=True)
@mock.patch('ironic.drivers.modules.fake.FakeDeploy.execute_deploy_step', @mock.patch('ironic.drivers.modules.fake.FakeDeploy.execute_deploy_step',
autospec=True) autospec=True)
def _do_next_deploy_step_execute_fail(self, exc, traceback, def _do_next_deploy_step_execute_fail(self, exc, traceback, handled,
mock_execute, mock_log): mock_execute, mock_log):
# When a deploy step fails, go to DEPLOYFAIL # When a deploy step fails, go to DEPLOYFAIL
driver_internal_info = {'deploy_step_index': None, driver_internal_info = {'deploy_step_index': None,
'deploy_steps': self.deploy_steps} 'deploy_steps': self.deploy_steps}
self._start_service() self._start_service()
node = obj_utils.create_test_node( node = obj_utils.create_test_node(
self.context, driver='fake-hardware', self.context, driver='fake-hardware',
driver_internal_info=driver_internal_info, driver_internal_info=driver_internal_info,
provision_state=states.DEPLOYFAIL if handled else states.DEPLOYING,
target_provision_state=states.ACTIVE,
last_error='existing error' if handled else None,
deploy_step={}) deploy_step={})
mock_execute.side_effect = exc mock_execute.side_effect = exc
task = task_manager.TaskManager(self.context, node.uuid) task = task_manager.TaskManager(self.context, node.uuid)
task.process_event('deploy')
deployments.do_next_deploy_step(task, 0) deployments.do_next_deploy_step(task, 0)
@ -657,20 +660,30 @@ class DoNextDeployStepTestCase(mgr_utils.ServiceSetUpMixin,
node.refresh() node.refresh()
self.assertEqual(states.DEPLOYFAIL, node.provision_state) self.assertEqual(states.DEPLOYFAIL, node.provision_state)
self.assertEqual(states.ACTIVE, node.target_provision_state) self.assertEqual(states.ACTIVE, node.target_provision_state)
self.assertEqual({}, node.deploy_step) if handled:
self.assertNotIn('deploy_step_index', node.driver_internal_info) self.assertEqual('existing error', node.last_error)
self.assertIsNotNone(node.last_error) else:
self.assertEqual({}, node.deploy_step)
self.assertNotIn('deploy_step_index', node.driver_internal_info)
self.assertIsNotNone(node.last_error)
self.assertIn(f"Deploy step deploy.{self.deploy_steps[0]['step']}",
node.last_error)
mock_log.error.assert_called_once_with(mock.ANY,
exc_info=traceback)
self.assertFalse(node.maintenance) self.assertFalse(node.maintenance)
mock_execute.assert_called_once_with(mock.ANY, mock.ANY, mock_execute.assert_called_once_with(mock.ANY, mock.ANY,
self.deploy_steps[0]) self.deploy_steps[0])
mock_log.error.assert_called_once_with(mock.ANY, exc_info=traceback)
def test_do_next_deploy_step_execute_ironic_exception(self): def test_do_next_deploy_step_execute_ironic_exception(self):
self._do_next_deploy_step_execute_fail( self._do_next_deploy_step_execute_fail(
exception.IronicException('foo'), False) exception.IronicException('foo'), False, False)
def test_do_next_deploy_step_execute_exception(self): def test_do_next_deploy_step_execute_exception(self):
self._do_next_deploy_step_execute_fail(Exception('foo'), True) self._do_next_deploy_step_execute_fail(Exception('foo'), True, False)
def test_do_next_deploy_step_execute_handled_exception(self):
self._do_next_deploy_step_execute_fail(
exception.IronicException('foo'), False, True)
@mock.patch('ironic.drivers.modules.fake.FakeDeploy.execute_deploy_step', @mock.patch('ironic.drivers.modules.fake.FakeDeploy.execute_deploy_step',
autospec=True) autospec=True)