[MO] Implement TensorFlow 2 While and Keras RNN support in MO (openvinotoolkit#3573)

* [MO] Implement TensorFlow 2 While support in MO

Signed-off-by: Roman Kazantsev <[email protected]>

* Add extractors for both While and StatelessWhile and do minor changes

Signed-off-by: Roman Kazantsev <[email protected]>

* Improve update_body_graph function and manage graph names properly

Signed-off-by: Roman Kazantsev <[email protected]>

* Fix a map for original name of parameters from body and cond

Signed-off-by: Roman Kazantsev <[email protected]>

* Implement draft version of support of TF2 Keras RNN

Signed-off-by: Roman Kazantsev <[email protected]>

* Implement Keras LSTM and GRU support in MO

Signed-off-by: Roman Kazantsev <[email protected]>

* Improve code for Keras RNN support

Signed-off-by: Roman Kazantsev <[email protected]>

* Finalize implementation of TF2 Keras RNN support in MO

Signed-off-by: Roman Kazantsev <[email protected]>

* Apply the first part of the comments after review #1

Signed-off-by: Roman Kazantsev <[email protected]>

* Avoid use of explicit values of port indices in the transformation

Signed-off-by: Roman Kazantsev <[email protected]>

* Finalize code after the first-round review

Signed-off-by: Roman Kazantsev <[email protected]>

* Apply comments after the second-round review

Signed-off-by: Roman Kazantsev <[email protected]>
rkazants authored Jan 21, 2021
1 parent 61ccde7 commit bacb842
Showing 11 changed files with 618 additions and 13 deletions.
3 changes: 3 additions & 0 deletions model-optimizer/automation/package_BOM.txt
@@ -404,6 +404,7 @@ extensions/front/tf/identity_ext.py
extensions/front/tf/identityN_to_identity.py
extensions/front/tf/InterpolateTransposes.py
extensions/front/tf/IteratorGetNext_ext.py
extensions/front/tf/KerasRNNTransformation.py
extensions/front/tf/log_softmax_ext.py
extensions/front/tf/LookupTableInsert_ext.py
extensions/front/tf/LoopCond_ext.py
@@ -483,6 +484,8 @@ extensions/front/tf/UnpackPackReverseInputChannels.py
extensions/front/tf/variable_ext.py
extensions/front/tf/variables_values_freezing.py
extensions/front/tf/WhereDecomposition.py
extensions/front/tf/while_ext.py
extensions/front/tf/WhileNormalize.py
extensions/front/tf/yolo_v1.json
extensions/front/tf/yolo_v1_tiny.json
extensions/front/tf/yolo_v2.json
8 changes: 6 additions & 2 deletions model-optimizer/extensions/back/SpecialNodesFinalization.py
@@ -1,5 +1,5 @@
"""
-Copyright (C) 2018-2020 Intel Corporation
+Copyright (C) 2018-2021 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
@@ -15,7 +15,6 @@
"""
import logging as log
from collections import defaultdict
-from copy import copy

import numpy as np

@@ -125,6 +124,11 @@ class RemoveConstToResult(BackReplacementPattern):
"""
enabled = True
force_clean_up = True
+    # TODO: remove this transformation once all plugins support constant value networks.
+    # Do not run recursively, since a Const->Result sub-graph can be encountered in a body graph of a Loop node,
+    # and this sub-graph is needed to avoid the dynamism created by the Loop node
+    # when an axis is used in the output port map
+    run_not_recursively = True

@staticmethod
def pattern():
5 changes: 4 additions & 1 deletion model-optimizer/extensions/front/standalone_const_eraser.py
@@ -1,5 +1,5 @@
"""
-Copyright (C) 2018-2020 Intel Corporation
+Copyright (C) 2018-2021 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
@@ -22,6 +22,9 @@

class StandaloneConstEraser(FrontReplacementSubgraph):
enabled = True
+    # TODO: remove this transformation once all plugins support constant value networks.
+    # It must not run recursively, since a Const->Result sub-graph can be encountered in a body graph of a Loop node
+    run_not_recursively = True

@staticmethod
def pattern():
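For context, a sketch of the contract that run_not_recursively relies on in both clean-up passes above. This is hypothetical driver code, not MO's actual implementation: a transformation with the flag set is applied to the main graph only, so Const->Result pairs inside Loop body graphs survive.

# Hypothetical illustration of the run_not_recursively contract.
def apply_transform(transform, graph):
    transform.find_and_replace_pattern(graph)
    if getattr(transform, 'run_not_recursively', False):
        return  # leave body graphs untouched, e.g. Const->Result pairs inside Loop
    for loop in graph.get_op_nodes(op='Loop'):
        apply_transform(transform, loop['body'])  # recurse into body graphs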
268 changes: 268 additions & 0 deletions model-optimizer/extensions/front/tf/KerasRNNTransformation.py
@@ -0,0 +1,268 @@
"""
Copyright (C) 2017-2021 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

import numpy as np

from extensions.front.tf.WhileNormalize import WhileNormalize
from extensions.ops.loop import Loop
from mo.front.common.partial_infer.utils import int64_array
from mo.front.common.replacement import FrontReplacementSubgraph
from mo.front.tf.graph_utils import create_op_with_const_inputs
from mo.graph.graph import Graph, Node, rename_nodes
from mo.middle.pattern_match import find_pattern_matches, inverse_dict
from mo.ops.const import Const
from mo.ops.squeeze import Squeeze
from mo.ops.unsqueeze import Unsqueeze


def compute_input_port_idx(req_node: Node, loop_node: Node):
"""
    Computes the input port index through which the requested node is passed to the Loop node
    :param req_node: a node for which the input port index is requested
    :param loop_node: a node that can receive input data from the requested node through some input port
    :return: the input port index, or None if the requested node does not feed the Loop node
"""
for destination in req_node.out_port(0).get_destinations():
if loop_node.id == destination.node.id:
return destination.idx
return None


def find_subgraph_match_to_pattern(graph: Graph, body_pattern: dict):
"""
    Finds sub-graph matches corresponding to the pattern in the graph
    :param graph: a graph to search for matched sub-graphs
    :param body_pattern: a pattern to match
    :return: a list of sub-graph matches
"""
matches = []
for match in find_pattern_matches(graph, **body_pattern):
match = inverse_dict(match)
for k in match:
match[k] = Node(graph, match[k])
matches.append(match)

return matches


class KerasRNNInputSlicing(FrontReplacementSubgraph):
"""
    The transformation detects the TensorFlow 2 pattern that corresponds to iteration-wise slicing of the input.
    It removes the TensorListFromTensor and TensorListGetItem operations and replaces the original sub-graph
    by setting the axis attribute on the corresponding input port of the Loop node.
    The transformation is applicable to TensorFlow 2 Keras SimpleRNN, GRU, and LSTM layers.
"""
enabled = True

def run_before(self):
return [WhileNormalize]

@staticmethod
def pattern(**kwargs):
return dict(
nodes=[('unstack', dict(op='TensorListFromTensor')),
('while', dict(op='Loop'))],
edges=[('unstack', 'while')]
)

@staticmethod
def get_body_pattern():
return dict(
nodes=[('tensor_list', dict(op='Parameter')),
('current_iteration', dict(op='Parameter')),
('slicing', dict(op='TensorListGetItem')),
('const_increment', dict(op='Const')),
('increment_iteration', dict(op='Add')),
('increment_iteration_identity', dict(op='Identity')),
('increment_iteration_result', dict(op='Result'))],
edges=[('tensor_list', 'slicing', {'in': 0}),
('current_iteration', 'slicing', {'in': 1}),
('const_increment', 'increment_iteration', {'in': 1}),
('current_iteration', 'increment_iteration', {'in': 0}),
('increment_iteration', 'increment_iteration_identity', {'in': 0}),
('increment_iteration_identity', 'increment_iteration_result', {'in': 0})]
)
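    # The body sub-graph matched by get_body_pattern, shown as data flow
    # (derived directly from the nodes and edges above):
    #
    #   tensor_list (Parameter) ────────────> slicing (TensorListGetItem)
    #   current_iteration (Parameter) ──┬───> slicing (TensorListGetItem)
    #                                   └───> increment_iteration (Add) <── const_increment (Const)
    #                                              │
    #                                              v
    #          increment_iteration_identity (Identity) ──> increment_iteration_result (Result)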

@staticmethod
def transform_keras_rnn_input_slicing(external_match: dict, internal_match: dict):
"""
        Transforms TensorFlow 2 input slicing into the use of the axis attribute on an input port of the Loop node
:param external_match: a match used for handling a part of the main graph responsible for input slicing
:param internal_match: a match used for handling a part of the body graph responsible for input slicing
"""
loop_node = external_match['while']
unstack_node = external_match['unstack']
body_graph = loop_node['body']

tensor_list_get_item_node = internal_match['slicing']
unstack_placeholder = internal_match['tensor_list']
tensor_list_get_item_node_name = tensor_list_get_item_node.soft_get('name', tensor_list_get_item_node.id)

        # 1. process the body graph to remove the unsupported TensorListGetItem operation:
        # replace TensorListGetItem with a Squeeze node and iterate through slices using the axis attribute of the input port
squeeze_list_element = create_op_with_const_inputs(body_graph, Squeeze, {1: int64_array(0)},
{'name': 'TensorListGetItemSqueeze'})
tensor_list_get_item_node.in_port(0).get_connection().set_destination(squeeze_list_element.in_port(0))
tensor_list_get_item_node.out_port(0).get_connection().set_source(squeeze_list_element.out_port(0))
rename_nodes([(tensor_list_get_item_node, tensor_list_get_item_node_name + '/AbandonedName'),
(squeeze_list_element, tensor_list_get_item_node_name)])
unstack_placeholder_layer_id = unstack_placeholder.internal_layer_id
Loop.update_port_map_value_ext(loop_node.input_port_map, 'internal_layer_id', unstack_placeholder_layer_id,
'axis', 0)
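        # the rewrite performed by step 1, schematically:
        #   before: tensor_list (Parameter) ──> TensorListGetItem(list, i) ──> consumers
        #   after:  sliced input (Parameter) ──> Squeeze(axis=0) ──> consumers,
        #           with axis=0 set in the Loop input port map entry of this Parameter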

        # 2. process the vicinity of the Loop node in the main graph to remove the unsupported
        # TensorListFromTensor operation: drop it and pass the tensor to the Loop node as is
unstack_node.out_port(0).get_connection().set_source(unstack_node.in_port(0).get_connection().get_source())

def replace_sub_graph(self, graph: Graph, external_match: dict):
loop_node = external_match['while']
body_graph = loop_node['body']
body_pattern = KerasRNNInputSlicing.get_body_pattern()
internal_matches = find_subgraph_match_to_pattern(body_graph, body_pattern)

        # the case of multiple matches is not handled since it is not clear how to select the corresponding match
if len(internal_matches) == 1:
internal_match = internal_matches[0]
loop_node = external_match['while']
unstack_port_idx = compute_input_port_idx(external_match['unstack'], loop_node)
            # check that back edges connect the correct Parameter and Result nodes in the body
            # check connections between body input ports and external input ports of the Loop node
if Loop.back_edge_exists(loop_node.back_edges,
internal_match['increment_iteration_result'].internal_layer_id,
internal_match['current_iteration'].internal_layer_id) and \
Loop.inter_edge_exists(loop_node.input_port_map, unstack_port_idx,
internal_match['tensor_list'].internal_layer_id):
                # process the sub-graph only if the inter-graph match checks passed
KerasRNNInputSlicing.transform_keras_rnn_input_slicing(external_match, internal_match)


class KerasRNNOutputConcatenation(FrontReplacementSubgraph):
"""
    The transformation detects the TensorFlow 2 pattern that corresponds to concatenation of intermediate results
    generated on each iteration of the While operation.
    It removes the TensorListReserve, TensorListStack, and TensorListSetItem operations and replaces the original
    sub-graph by setting the axis attribute on the corresponding output port of the Loop node.
    The transformation is applicable to TensorFlow 2 Keras SimpleRNN, GRU, and LSTM layers.
"""
enabled = True

def run_before(self):
return [WhileNormalize]

@staticmethod
def pattern(**kwargs):
return dict(
nodes=[('reserve', dict(op='TensorListReserve')),
('while', dict(op='Loop')),
('stack', dict(op='TensorListStack'))],
edges=[('reserve', 'while'),
('while', 'stack')]
)

@staticmethod
def get_body_pattern():
return dict(
nodes=[('container', dict(op='Parameter')),
('current_iteration', dict(op='Parameter')),
('const_increment', dict(op='Const')),
('increment_iteration', dict(op='Add')),
('increment_iteration_identity', dict(op='Identity')),
('increment_iteration_result', dict(op='Result')),
('concatenation', dict(op='TensorListSetItem')),
('concatenation_identity', dict(op='Identity')),
('concatenation_result', dict(op='Result')),
],
edges=[('const_increment', 'increment_iteration', {'in': 1}),
('current_iteration', 'increment_iteration', {'in': 0}),
('container', 'concatenation', {'in': 0}),
('current_iteration', 'concatenation', {'in': 1}),
('concatenation', 'concatenation_identity', {'in': 0}),
('concatenation_identity', 'concatenation_result', {'in': 0}),
('increment_iteration', 'increment_iteration_identity', {'in': 0}),
('increment_iteration_identity', 'increment_iteration_result', {'in': 0})]
)
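    # The body sub-graph matched by get_body_pattern, shown as data flow
    # (the item written by TensorListSetItem arrives on its input port 2 from outside the matched pattern):
    #
    #   container (Parameter) ──────────────> concatenation (TensorListSetItem)
    #   current_iteration (Parameter) ──┬───> concatenation (TensorListSetItem)
    #                                   └───> increment_iteration (Add) <── const_increment (Const)
    #
    #   concatenation ──> concatenation_identity (Identity) ──> concatenation_result (Result)
    #   increment_iteration ──> increment_iteration_identity (Identity) ──> increment_iteration_result (Result)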

@staticmethod
def transform_keras_rnn_output_concatenation(external_match: dict, internal_match: dict):
"""
        Transforms TensorFlow 2 output concatenation into the use of the axis attribute on an output port of the Loop node
:param external_match: a match used for handling a part of the main graph responsible for output concatenation
:param internal_match: a match used for handling a part of the body graph responsible for output concatenation
"""
loop_node = external_match['while']
stack_node = external_match['stack']
list_reserve_node = external_match['reserve']
body_graph = loop_node['body']

tensor_list_set_item_node = internal_match['concatenation']
tensor_list_set_item_node_name = tensor_list_set_item_node.soft_get('name', tensor_list_set_item_node.id)
list_result_node = internal_match['concatenation_result']

        # replace TensorListSetItem with Unsqueeze and set the axis attribute in the Loop output port map entry
        # of the corresponding Result node to concatenate results from different iterations
unsqueeze_list_element = create_op_with_const_inputs(body_graph, Unsqueeze, {1: int64_array(0)},
{'name': 'TensorListSetItemUnsqueeze'})
tensor_list_set_item_node.in_port(2).get_connection().set_destination(unsqueeze_list_element.in_port(0))
tensor_list_set_item_node.out_port(0).get_connection().set_source(unsqueeze_list_element.out_port(0))
rename_nodes([(tensor_list_set_item_node, tensor_list_set_item_node_name + '/AbandonedName'),
(unsqueeze_list_element, tensor_list_set_item_node_name)])
list_result_node_layer_id = list_result_node.internal_layer_id
Loop.update_port_map_value_ext(loop_node.output_port_map, 'internal_layer_id', list_result_node_layer_id,
'axis', 0)
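        # the rewrite performed above, schematically:
        #   before: item ──> TensorListSetItem(container, i, item) ──> ... ──> Result
        #   after:  item ──> Unsqueeze(axis=0) ──> ... ──> Result,
        #           with axis=0 set in the Loop output port map entry of this Result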

        # bypass TensorListStack since the result from the Loop node is already concatenated
stack_node.out_port(0).get_connection().set_source(stack_node.in_port(0).get_connection().get_source())

        # disconnect the TensorListReserve node because it is no longer needed for the Loop node
list_reserve_node.out_port(0).disconnect()

        # connect the trip count input of the Loop node to the iteration count received from the second input of TensorListReserve;
        # create a Const with value True for the execution condition so that IE can ignore the execution condition
        # and perform trip_count iterations. Using a known trip count value avoids dynamism.
loop_node.in_port(1).disconnect()
list_reserve_node.in_port(1).get_source().connect(loop_node.in_port(1))
for record in loop_node.output_port_map:
if 'purpose' in record and record['purpose'] == 'execution_condition':
exec_cond_layer_id = record['internal_layer_id']
exec_cond_node = Loop.get_body_node_by_internal_id(loop_node, exec_cond_layer_id)
const_true = Const(body_graph, {'value': np.array(True, dtype=np.bool)}).create_node()
exec_cond_node.in_port(0).get_connection().set_source(const_true.out_port(0))

def replace_sub_graph(self, graph: Graph, external_match: dict):
loop_node = external_match['while']
body_graph = loop_node['body']
body_pattern = KerasRNNOutputConcatenation.get_body_pattern()

internal_matches = find_subgraph_match_to_pattern(body_graph, body_pattern)

if len(internal_matches) == 1:
internal_match = internal_matches[0]
reserve_port_idx = compute_input_port_idx(external_match['reserve'], loop_node)
stack_port_idx = external_match['stack'].in_port(0).get_source().idx
            # check that back edges connect the correct Parameter and Result nodes in the body
            # check connections between body input ports and external input ports of the Loop node
            # check connections between body output ports and external output ports of the Loop node
if Loop.back_edge_exists(loop_node.back_edges, internal_match['concatenation_result'].internal_layer_id,
internal_match['container'].internal_layer_id) and \
Loop.back_edge_exists(loop_node.back_edges,
internal_match['increment_iteration_result'].internal_layer_id,
internal_match['current_iteration'].internal_layer_id) and \
Loop.inter_edge_exists(loop_node.input_port_map, reserve_port_idx,
internal_match['container'].internal_layer_id) and \
Loop.inter_edge_exists(loop_node.output_port_map, stack_port_idx,
internal_match['concatenation_result'].internal_layer_id):
KerasRNNOutputConcatenation.transform_keras_rnn_output_concatenation(external_match, internal_match)
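For reference, a minimal TensorFlow 2 script that produces the While/TensorList pattern targeted by the two transformations above. It is illustrative only and not part of this commit; the layer sizes, file names, and conversion command are assumptions.

import tensorflow as tf

# A Keras model with a recurrent layer; saving it yields a StatelessWhile loop
# whose body slices the input via TensorListFromTensor/TensorListGetItem and
# accumulates per-iteration outputs via TensorListReserve/TensorListSetItem/TensorListStack.
model = tf.keras.Sequential([
    tf.keras.layers.LSTM(16, return_sequences=True, input_shape=(10, 8))
])
model.save('keras_lstm')  # SavedModel directory

# Conversion with the Model Optimizer (paths and flags are illustrative):
#   python mo.py --saved_model_dir keras_lstm --input_shape [1,10,8]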
53 changes: 53 additions & 0 deletions model-optimizer/extensions/front/tf/WhileNormalize.py
@@ -0,0 +1,53 @@
"""
Copyright (C) 2017-2021 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""

import numpy as np

from extensions.ops.loop import Loop
from mo.front.common.replacement import FrontReplacementSubgraph
from mo.graph.graph import Graph, Node
from mo.ops.const import Const


class WhileNormalize(FrontReplacementSubgraph):
"""
    Normalizes inputs of the Loop node that replaces the TensorFlow 2 While operation:
    1) Remove the external input port for the current iteration
    2) Move the trip count from port #1 to port #0
    3) Occupy port #1 with the execution condition
"""
enabled = True

def find_and_replace_pattern(self, graph: Graph):
for node in graph.get_op_nodes(op='Loop'):
self.normalize_loop_node(graph, node)

@staticmethod
def normalize_loop_node(graph: Graph, loop_node: Node):
loop_name = loop_node.soft_get('name', loop_node.id)

# disconnect current iteration from external port #0 and move trip count to this port
loop_node.in_port(0).disconnect()
loop_node.in_port(1).get_connection().add_destination(loop_node.in_port(0))
Loop.update_port_map_value(loop_node.input_port_map, 'external_port_id', 1, 0)

# connect execution condition port
exec_cond_node = Const(graph, {'name': loop_name + '/ExecutionConditionValue',
'value': np.array(True, dtype=np.bool)}).create_node()
loop_node.in_port(1).get_connection().set_source(exec_cond_node.out_port(0))

loop_node.body.clean_up()
Loop.normalize_input_output_ports(loop_node)
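For reference, a hypothetical standalone equivalent of Loop.update_port_map_value as called above (the real helper lives in extensions/ops/loop.py and is not shown in this commit):

# Hypothetical sketch, not the actual MO implementation: rewrite one attribute
# value in the matching port map records.
def update_port_map_value(port_map: list, attr: str, old_value, new_value):
    for record in port_map:
        if record.get(attr) == old_value:
            record[attr] = new_value

# Usage mirroring normalize_loop_node: the trip count moves from external port 1
# to external port 0.
input_port_map = [{'external_port_id': 1, 'internal_layer_id': 0}]
update_port_map_value(input_port_map, 'external_port_id', 1, 0)
assert input_port_map[0]['external_port_id'] == 0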