
While the flow is in REVERTING or REVERTED state, reverted tasks are now left in REVERTED state. They are then reset to PENDING state when the flow is run again. With this change:
- when a task is in REVERTED state, its result (if the task was successfully executed before) is removed, but its failure (if its execution or reversion failed) is still available from storage;
- when the flow is in REVERTED or FAILURE state, you can get all task failures from storage;
- if the flow is in REVERTED or REVERTING state, but a task is in PENDING state, it means this task was never executed;
- the flow can no longer transition from REVERTED to RUNNING state -- it must go through PENDING state; on the REVERTED -> PENDING transition the tasks of the flow are reset.

This ensures that failure information is available until it becomes irrelevant.

Closes-bug: #1246612
Change-Id: I27c3891f5d412d6de6240638b5014afda94a58a4
264 lines
9.8 KiB
Python
264 lines
9.8 KiB
Python
# -*- coding: utf-8 -*-
|
|
|
|
# vim: tabstop=4 shiftwidth=4 softtabstop=4
|
|
|
|
# Copyright (C) 2012 Yahoo! Inc. All Rights Reserved.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License"); you may
|
|
# not use this file except in compliance with the License. You may obtain
|
|
# a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
|
|
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
|
|
# License for the specific language governing permissions and limitations
|
|
# under the License.
|
|
|
|
import threading
|
|
|
|
from concurrent import futures
|
|
|
|
from taskflow.engines.action_engine import graph_action
|
|
from taskflow.engines.action_engine import task_action
|
|
from taskflow.engines import base
|
|
|
|
from taskflow import exceptions as exc
|
|
from taskflow.openstack.common import excutils
|
|
from taskflow.openstack.common import uuidutils
|
|
from taskflow import states
|
|
from taskflow import storage as t_storage
|
|
|
|
from taskflow.utils import flow_utils
|
|
from taskflow.utils import lock_utils
|
|
from taskflow.utils import misc
|
|
from taskflow.utils import reflection
|
|
from taskflow.utils import threading_utils
|
|
|
|
|
|
class ActionEngine(base.EngineBase):
    """Generic action-based engine.

    This engine flattens the flow (and any subflows) into an execution graph
    which contains the full runtime definition to be executed and then uses
    this graph in combination with the action classes & storage to attempt to
    run your flow (and any subflows & contained tasks) to completion.

    During this process it is permissible and valid to have a task or multiple
    tasks in the execution graph fail, which will cause the process of
    reversion to commence. See the valid states in the states module to learn
    more about what other states the tasks & flow being run can go through.
    """

    # Class used by compile() to wrap the flattened task graph; compile()
    # asserts that a subclass has provided it.
    _graph_action = None

    def __init__(self, flow, flow_detail, backend, conf):
        """Sets up the (not yet compiled) engine state and notifiers."""
        super(ActionEngine, self).__init__(flow, flow_detail, backend, conf)
        # Known task failures, keyed by task uuid.
        self._failures = {}
        # Root graph action; stays None until compile() has been called.
        self._root = None
        self._lock = threading.RLock()
        # Referenced by name in the decorator applied to _change_state().
        self._state_lock = threading.RLock()
        self.notifier = misc.TransitionNotifier()
        self.task_notifier = misc.TransitionNotifier()

    def _revert(self, current_failure=None):
        """Reverts the compiled graph and then re-raises known failures.

        The flow is moved to REVERTING, the root action is reverted and the
        flow is moved to whatever state the reversion returned. If reverting
        itself raises, the flow is moved to FAILURE and the exception is
        propagated. Unless the reversion ended up SUSPENDED, the collected
        task failures are handed to ``misc.Failure.reraise_if_any`` and
        afterwards ``current_failure`` (when given) is re-raised.
        """
        self._change_state(states.REVERTING)
        try:
            outcome = self._root.revert(self)
        except Exception:
            with excutils.save_and_reraise_exception():
                self._change_state(states.FAILURE)

        self._change_state(outcome)
        if outcome == states.SUSPENDED:
            # Reversion was interrupted; nothing is re-raised in this case.
            return
        known_failures = self._failures.values()
        misc.Failure.reraise_if_any(known_failures)
        if current_failure:
            current_failure.reraise()

    def __str__(self):
        cls_name = reflection.get_class_name(self)
        return "%s: %s" % (cls_name, id(self))

    def suspend(self):
        """Attempts to suspend the engine.

        If the engine is currently running tasks then this will attempt to
        suspend future work from being started (currently active tasks can
        not currently be preempted) and move the engine into a suspend state
        which can then later be resumed from.
        """
        self._change_state(states.SUSPENDING)

    @property
    def execution_graph(self):
        """The graph held by the root action (compiles the flow if needed)."""
        self.compile()
        return self._root.graph

    @lock_utils.locked
    def run(self):
        """Runs the flow in the engine to completion."""
        # A previously reverted flow has its tasks reset before it is run
        # again.
        if self.storage.get_flow_state() == states.REVERTED:
            self._reset()
        self.compile()

        available = set(self.storage.fetch_all().keys())
        missing = self._flow.requires - available
        if missing:
            raise exc.MissingDependencies(self._flow, sorted(missing))

        # Failures loaded during compile() mean reversion is continued
        # instead of starting execution.
        if self._failures:
            self._revert()
            return
        self._run()

    def _run(self):
        """Executes the compiled graph, reverting it when execution raises."""
        self._change_state(states.RUNNING)
        try:
            outcome = self._root.execute(self)
        except Exception:
            self._change_state(states.FAILURE)
            # The failure object is created while the exception is still
            # being handled.
            self._revert(misc.Failure())
            return
        self._change_state(outcome)

    @lock_utils.locked(lock='_state_lock')
    def _change_state(self, state):
        """Moves the flow to ``state`` and notifies the flow listeners.

        Nothing is stored and nobody is notified when
        ``states.check_flow_transition`` rejects the transition from the
        currently stored state.
        """
        previous = self.storage.get_flow_state()
        if not states.check_flow_transition(previous, state):
            return
        self.storage.set_flow_state(state)
        try:
            flow_uuid = self._flow.uuid
        except AttributeError:
            # NOTE(harlowja): if the flow was just a single task, then it will
            # not itself have a uuid, but the constructed flow_detail will.
            detail = self._flow_detail
            flow_uuid = detail.uuid if detail is not None else None
        details = {
            'engine': self,
            'flow_name': self._flow.name,
            'flow_uuid': flow_uuid,
            'old_state': previous,
        }
        self.notifier.notify(state, details)

    def _on_task_state_change(self, task_action, state, result=None):
        """Notifies the engine that the following task action has completed
        a given state with a given result. This is *internal* to the action
        engine and its associated action classes, not for use externally.
        """
        task_uuid = task_action.uuid
        if isinstance(result, misc.Failure):
            # Remember the failure so that it can be re-raised after revert.
            self._failures[task_uuid] = result
        details = {
            'engine': self,
            'task_name': task_action.name,
            'task_uuid': task_uuid,
            'result': result,
        }
        self.task_notifier.notify(state, details)

    def _reset(self):
        """Resets tasks in storage, forgets failures and goes to PENDING.

        A PENDING task notification (with no result) is sent for every
        ``(name, uuid)`` pair that ``storage.reset_tasks()`` yields.
        """
        for task_name, task_uuid in self.storage.reset_tasks():
            details = {
                'engine': self,
                'task_name': task_name,
                'task_uuid': task_uuid,
                'result': None,
            }
            self.task_notifier.notify(states.PENDING, details)
        self._failures = {}
        self._change_state(states.PENDING)

    @lock_utils.locked
    def compile(self):
        """Compiles the contained flow into a structure which the engine can
        use to run or if this can not be done then an exception is thrown
        indicating why this compilation could not be achieved.
        """
        if self._root is not None:
            # Already compiled.
            return

        assert self._graph_action is not None, (
            'Graph action class must be specified')
        self._change_state(states.RESUMING)  # does nothing in PENDING state
        graph = flow_utils.flatten(self._flow)
        self._root = self._graph_action(graph)
        restored = {}

        for task in graph.nodes_iter():
            # Reuse the uuid storage already has for this task name, or
            # register the task under a newly generated one.
            try:
                task_id = self.storage.get_uuid_by_name(task.name)
            except exc.NotFound:
                task_id = uuidutils.generate_uuid()
                version = misc.get_version_string(task)
                self.storage.add_task(task_name=task.name, uuid=task_id,
                                      task_version=version)

            try:
                stored = self.storage.get(task_id)
            except exc.NotFound:
                stored = None

            if isinstance(stored, misc.Failure):
                # NOTE(imelnikov): old failure may have exc_info which
                # might get lost during serialization, so we preserve
                # old failure object if possible.
                previous = self._failures.get(task_id)
                if stored.matches(previous):
                    restored[task_id] = previous
                else:
                    restored[task_id] = stored

            self.storage.set_result_mapping(task_id, task.save_as)
            self._root.add(task, task_action.TaskAction(task, task_id))

        self._failures = restored
        self._change_state(states.SUSPENDED)  # does nothing in PENDING state

    @property
    def is_running(self):
        """True when the stored flow state is RUNNING."""
        return self.storage.get_flow_state() == states.RUNNING

    @property
    def is_reverting(self):
        """True when the stored flow state is REVERTING."""
        return self.storage.get_flow_state() == states.REVERTING
|
|
|
|
|
|
class SingleThreadedActionEngine(ActionEngine):
    """Action engine that attempts to run in a serial manner.

    It pairs the sequential graph action with the plain storage class.
    """

    _storage_cls = t_storage.Storage
    _graph_action = graph_action.SequentialGraphAction
|
|
|
|
|
|
class MultiThreadedActionEngine(ActionEngine):
    """Action engine that attempts to run in a parallel manner.

    It pairs the parallel graph action with the thread safe storage class
    and uses an executor, either taken from ``conf['executor']`` or created
    (and shut down again) for each call of ``run()``.
    """

    _storage_cls = t_storage.ThreadSafeStorage
    _graph_action = graph_action.ParallelGraphAction

    def __init__(self, flow, flow_detail, backend, conf):
        """Sets up the engine, remembering the configured executor if any."""
        super(MultiThreadedActionEngine, self).__init__(
            flow, flow_detail, backend, conf)
        self._executor = conf.get('executor', None)

    @lock_utils.locked
    def run(self):
        """Runs the flow, creating a temporary executor when none is set."""
        # NOTE(harlowja): since no executor was provided we have to create
        # one, and also ensure that we shutdown the one we create to
        # ensure that we don't leak threads.
        owns_executor = self._executor is None
        if owns_executor:
            worker_count = threading_utils.get_optimal_thread_count()
            self._executor = futures.ThreadPoolExecutor(worker_count)

        try:
            ActionEngine.run(self)
        finally:
            # Don't forget to shutdown the executor!!
            if owns_executor:
                try:
                    self._executor.shutdown(wait=True)
                finally:
                    # Dropped even when the shutdown itself raises.
                    self._executor = None

    @property
    def executor(self):
        """Returns the current executor, if no executor is provided on
        construction then this executor will change each time the engine
        is run.
        """
        return self._executor
|