Merge Mistral task data into the execution context

After this patch, the user can choose whether task data is replaced or merged into the execution context.
For example: merge_strategy: replace/merge

Implements: blueprint merge-mistral-tasks-data
Change-Id: I3c96bab9953c4995f2b718ac48dff0f153872026
Vasudeo Nimbekar 2022-12-26 16:11:21 +05:30
parent bfcc417044
commit 7c35734300
4 changed files with 442 additions and 2 deletions


@@ -105,6 +105,74 @@ directory.
   of OpenStack projects in your deployment. Please find more detailed
   information in ``tools/get_action_list.py`` script.

#. Configure the merge strategy feature if needed. It changes the default
   Mistral behavior in which one variable simply replaces another inside
   its own context.

   For example::

       version: '2.0'

       wf:
         input:
           - aa:
               bb: wf_ex_input
               cc: wf_ex_input
               zz: wf_ex_input

         output:
           aa: <% $.aa %>

         tasks:
           task1:
             action: std.echo
             # emulate some action result
             input:
               output:
                 cc: task1_res
                 dd: task1_res
             on-success: [task2]
             publish:
               aa:
                 cc: <% task().result["cc"] %>
                 dd: <% task().result["dd"] %>

           task2:
             action: std.echo
             # emulate some action result
             input:
               output:
                 bb: task2_res
             publish:
               aa:
                 bb: <% task().result["bb"] %>

   The default result of the execution is::

       {
         "aa": {
           "bb": "task2_res"
         }
       }

   To merge the results of tasks, use a flat data structure or the YAQL
   merge function.

   The merge_strategy option has the following values:

   * `replace` - The default value. This is the previous behavior, in which
     one variable replaces another in the context.
   * `merge` - With this value, a variable is merged with the rest of the
     context.

   With the `merge` strategy, the same workflow as above produces::

       {
         "aa": {
           "bb": "task2_res",
           "cc": "task1_res",
           "dd": "task1_res",
           "zz": "wf_ex_input"
         }
       }

   merge_strategy can be configured as follows::

       [engine]
       merge_strategy = replace

#. Configure Task affinity feature if needed. It is needed for distinguishing
   either single task executor or one task executor from group of task
   executors::
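
The behavioral difference documented in this hunk can be reproduced with plain Python dictionaries. The sketch below is only an illustration of the two strategies, not Mistral code; deep_merge is a hypothetical stand-in for the engine's merge helper, assuming the right-hand side wins on conflicting scalar values:

    import copy


    def deep_merge(left, right):
        """Recursively merge ``right`` into ``left`` (right wins on conflicts)."""
        for key, value in right.items():
            if isinstance(left.get(key), dict) and isinstance(value, dict):
                deep_merge(left[key], value)
            else:
                left[key] = copy.deepcopy(value)
        return left


    wf_input = {'aa': {'bb': 'wf_ex_input', 'cc': 'wf_ex_input', 'zz': 'wf_ex_input'}}
    task1_publish = {'aa': {'cc': 'task1_res', 'dd': 'task1_res'}}
    task2_publish = {'aa': {'bb': 'task2_res'}}

    # 'replace' strategy: each publish overwrites the whole 'aa' variable.
    replace_ctx = dict(wf_input)
    replace_ctx.update(task1_publish)
    replace_ctx.update(task2_publish)
    print(replace_ctx)  # {'aa': {'bb': 'task2_res'}}

    # 'merge' strategy: each publish is merged into the existing 'aa' variable.
    merge_ctx = {}
    for d in (wf_input, task1_publish, task2_publish):
        deep_merge(merge_ctx, d)
    print(merge_ctx)
    # {'aa': {'bb': 'task2_res', 'cc': 'task1_res',
    #         'dd': 'task1_res', 'zz': 'wf_ex_input'}}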


@@ -250,6 +250,13 @@ engine_opts = [
            'to start subworkflow via RPC to improve load balancing '
            'in case of several engine instances.'
        )
    ),
    cfg.StrOpt(
        'merge_strategy',
        choices=['replace', 'merge'],
        default="replace",
        help=_('Merge strategy of data inside workflow execution. '
               '(replace, merge)')
    )
]
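
For context on how such an option is consumed, here is a minimal, standalone oslo.config sketch. Only the group and option names are taken from the diff above; the rest is illustrative and not Mistral code:

    from oslo_config import cfg

    conf = cfg.ConfigOpts()
    conf.register_opts(
        [cfg.StrOpt('merge_strategy',
                    choices=['replace', 'merge'],
                    default='replace')],
        group='engine'
    )
    conf(args=[])  # no CLI arguments or config files, so defaults apply

    print(conf.engine.merge_strategy)  # -> 'replace'

    # Operators set this in mistral.conf under [engine]; tests typically
    # override it at runtime instead, as the new test module below does.
    conf.set_override('merge_strategy', 'merge', group='engine')
    print(conf.engine.merge_strategy)  # -> 'merge'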


@@ -0,0 +1,356 @@
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

from oslo_config import cfg

from mistral.db.v2 import api as db_api
from mistral.services import workflows as wf_service
from mistral.tests.unit.engine import base
from mistral.workflow import states

# Use the set_default method to set the value, otherwise in certain test
# cases the change in value is not permanent.
cfg.CONF.set_default('auth_enable', False, group='pecan')


class DirectWorkflowEngineTest(base.EngineTestCase):
    def _run_workflow(self, wf_text, wf_input=None,
                      expected_state=states.SUCCESS):
        wf_service.create_workflows(wf_text)

        wf_ex = self.engine.start_workflow('wf', wf_input=wf_input)

        self.await_workflow_state(wf_ex.id, expected_state)

        return db_api.get_workflow_execution(wf_ex.id)

    def test_replace(self):
        self.override_config('merge_strategy', 'replace', group='engine')

        wf_text = """
        version: '2.0'

        wf:
          input:
            - aa:
                bb: wf_ex_input
                cc: wf_ex_input
                zz: wf_ex_input

          output:
            aa: <% $.aa %>

          tasks:
            task1:
              action: std.echo
              # emulate some action result
              input:
                output:
                  cc: task1_res
                  dd: task1_res
              on-success: [task2]
              publish:
                aa:
                  cc: <% task().result["cc"] %>
                  dd: <% task().result["dd"] %>

            task2:
              action: std.echo
              # emulate some action result
              input:
                output:
                  bb: task2_res
              publish:
                aa:
                  bb: <% task().result["bb"] %>
        """

        wf_ex = self._run_workflow(wf_text)

        with db_api.transaction():
            wf_ex = db_api.get_workflow_execution(wf_ex.id)

            wf_ex_res = wf_ex.output

            task1 = self._assert_single_item(
                wf_ex.task_executions,
                name='task1'
            )

            task1_publish = task1.published

        expected_wf_ex_res = {
            "aa": {
                "bb": "task2_res"
            }
        }

        self.assertDictEqual(expected_wf_ex_res, wf_ex_res)

        expected_task1_res = {
            "aa": {
                "cc": "task1_res",
                "dd": "task1_res"
            }
        }

        self.assertDictEqual(expected_task1_res, task1_publish)

    def test_merge_input_and_publish(self):
        self.override_config('merge_strategy', 'merge', group='engine')

        wf_text = """
        version: '2.0'

        wf:
          input:
            - aa:
                bb:
                  bb_1: wf_ex_input
                  bb_2: wf_ex_input
                cc: wf_ex_input

          output:
            aa: <% $.aa %>

          tasks:
            task1:
              action: std.echo
              # emulate some action result
              input:
                output:
                  cc: task_res
                  dd: task_res
                  bb_2: task_res
              publish:
                aa:
                  bb:
                    bb_2: <% task().result["bb_2"] %>
                  cc: <% task().result["cc"] %>
                  dd: <% task().result["dd"] %>
        """

        wf_ex = self._run_workflow(wf_text)

        with db_api.transaction():
            wf_ex = db_api.get_workflow_execution(wf_ex.id)

            wf_ex_res = wf_ex.output

        expected_wf_ex_res = {
            "aa": {
                "bb": {
                    "bb_1": "wf_ex_input",
                    "bb_2": "task_res"
                },
                "cc": "task_res",
                "dd": "task_res"
            }
        }

        self.assertDictEqual(expected_wf_ex_res, wf_ex_res)

    def test_merge_publish_two_tasks(self):
        self.override_config('merge_strategy', 'merge', group='engine')

        wf_text = """
        version: '2.0'

        wf:
          input:
            - aa:
                bb: wf_ex_input
                cc: wf_ex_input
                zz: wf_ex_input

          output:
            aa: <% $.aa %>

          tasks:
            task1:
              action: std.echo
              # emulate some action result
              input:
                output:
                  cc: task1_res
                  dd: task1_res
              on-success: [task2]
              publish:
                aa:
                  cc: <% task().result["cc"] %>
                  dd: <% task().result["dd"] %>

            task2:
              action: std.echo
              # emulate some action result
              input:
                output:
                  bb: task2_res
              publish:
                aa:
                  bb: <% task().result["bb"] %>
        """

        wf_ex = self._run_workflow(wf_text)

        with db_api.transaction():
            wf_ex = db_api.get_workflow_execution(wf_ex.id)

            wf_ex_res = wf_ex.output

        expected_wf_ex_res = {
            "aa": {
                "bb": "task2_res",
                "cc": "task1_res",
                "dd": "task1_res",
                "zz": "wf_ex_input"
            }
        }

        self.assertDictEqual(expected_wf_ex_res, wf_ex_res)

    def test_merge_publish_result_from_join(self):
        self.override_config('merge_strategy', 'merge', group='engine')

        wf_text = """
        version: '2.0'

        wf:
          input:
            - aa:
                aa: wf_ex_input
                bb: wf_ex_input
                cc: wf_ex_input
                zz: wf_ex_input
                dd: wf_ex_input

          output:
            aa: <% $.aa %>

          tasks:
            task0:
              action: std.echo
              # emulate some action result
              input:
                output:
                  res: task0_res
              on-success: [task1, task2]
              publish:
                aa:
                  aa: <% task().result["res"] %>
                  aa_1: <% task().result["res"] %>

            task1:
              action: std.echo
              # emulate some action result
              input:
                output:
                  res: task1_res
              on-success: [task3]
              publish:
                aa:
                  bb: <% task().result["res"] %>
                  bb_1: <% task().result["res"] %>

            task2:
              action: std.echo
              input:
                output:
                  res: task2_res
              on-success: [task3]
              publish:
                aa:
                  cc: <% task().result["res"] %>
                  cc_1: <% task().result["res"] %>

            task3:
              action: std.echo
              join: all
              input:
                output:
                  res: task3_res
              publish:
                aa:
                  zz: <% $.aa.bb_1 + $.aa.cc_1 + $.aa.aa_1 %>
                  zz_1: <% task().result["res"] %>
        """

        wf_ex = self._run_workflow(wf_text)

        with db_api.transaction():
            wf_ex = db_api.get_workflow_execution(wf_ex.id)

            wf_ex_res = wf_ex.output

        expected_wf_ex_res = {
            "aa": {
                "aa": "task0_res",
                "aa_1": "task0_res",
                "bb": "task1_res",
                "bb_1": "task1_res",
                "cc": "task2_res",
                "cc_1": "task2_res",
                "zz": "task1_restask2_restask0_res",
                "zz_1": "task3_res",
                "dd": "wf_ex_input"
            }
        }

        self.assertDictEqual(expected_wf_ex_res, wf_ex_res)

    def test_merge_publish_two_parallel_tasks(self):
        self.override_config('merge_strategy', 'merge', group='engine')

        wf_text = """
        version: '2.0'

        wf:
          input:
            - aa:
                bb: wf_ex_input
                cc: wf_ex_input
                dd: wf_ex_input
                ee: wf_ex_input
                zz: wf_ex_input

          output:
            aa: <% $.aa %>

          tasks:
            task_1_1:
              action: std.echo
              # emulate some action result
              input:
                output:
                  res: task_1_1_res
              on-success: [task_2_1]
              publish:
                aa:
                  bb: <% task().result["res"] %>

            task_1_2:
              action: std.echo
              # emulate some action result
              input:
                output:
                  res: task_1_2_res
              on-success: [task_2_1]
              publish:
                aa:
                  cc: <% task().result["res"] %>

            task_2_1:
              action: std.echo
              # emulate some action result
              join: all
              input:
                output:
                  res: task_2_1_res
              on-success: [task_3_1]
              publish:
                aa:
                  dd: <% task().result["res"] %>

            task_3_1:
              action: std.echo
              # emulate some action result
              input:
                output:
                  res: task_3_1_res
              publish:
                aa:
                  ee: <% task().result["res"] %>
        """

        wf_ex = self._run_workflow(wf_text)

        with db_api.transaction():
            wf_ex = db_api.get_workflow_execution(wf_ex.id)

            wf_ex_res = wf_ex.output

        expected_wf_ex_res = {
            "aa": {
                "bb": "task_1_1_res",
                "cc": "task_1_2_res",
                "dd": "task_2_1_res",
                "ee": "task_3_1_res",
                "zz": "wf_ex_input"
            }
        }

        self.assertDictEqual(expected_wf_ex_res, wf_ex_res)


@@ -46,8 +46,14 @@ class ContextView(dict):
     def __init__(self, *dicts):
         super(ContextView, self).__init__()
 
-        self.dicts = [d for d in dicts if d is not None]
+        if CONF.engine.merge_strategy == 'merge':
+            res = {}
+
+            for d in reversed(dicts):
+                res = utils.merge_dicts(res, d)
+
+            self.dicts = [res]
+        else:
+            self.dicts = [d for d in dicts if d is not None]
 
     def __getitem__(self, key):
         for d in self.dicts:
@@ -246,7 +252,10 @@ def evaluate_task_outbound_context(task_ex):
         if getattr(task_ex, 'in_context', None) is not None else {}
     )
 
-    return utils.update_dict(in_context, getattr(task_ex, 'published', {}))
+    if CONF.engine.merge_strategy == 'merge':
+        return utils.merge_dicts(in_context, getattr(task_ex, 'published', {}))
+    else:
+        return utils.update_dict(in_context, getattr(task_ex, 'published', {}))
 
 
 def evaluate_workflow_output(wf_ex, wf_output, ctx):
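
A side note on the ordering in ContextView.__init__ (illustration only, not Mistral code): __getitem__ scans self.dicts in order and returns the first dict containing the key, so earlier dicts take precedence. Folding over reversed(dicts) applies the earlier dicts last, so, assuming utils.merge_dicts lets its right-hand argument win on conflicts, they also win in the single collapsed dict and the lookup precedence is preserved:

    # Flat dicts are enough to show the precedence; the real helper also
    # merges nested dicts recursively.
    dicts = [
        {'key': 'from_task_publish'},                        # highest priority
        {'key': 'from_wf_input', 'other': 'from_wf_input'},  # lowest priority
    ]

    collapsed = {}
    for d in reversed(dicts):
        collapsed.update(d)  # stand-in for utils.merge_dicts(collapsed, d)

    print(collapsed)  # {'key': 'from_task_publish', 'other': 'from_wf_input'}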