From 90bf6c6846ca6a49b44547c5d5877e21dd121932 Mon Sep 17 00:00:00 2001 From: "Maxim, Vafin" Date: Fri, 24 Apr 2020 17:05:49 +0300 Subject: [PATCH 01/31] [MO] Implement EmbeddingBag_3 --- .../extensions/front/ATenToEmbeddingBag.py | 18 ++- .../extensions/front/onnx/aten_ext.py | 3 +- .../extensions/middle/EmbeddingBagResolver.py | 111 --------------- .../middle/EmbeddingBagResolver_test.py | 127 ------------------ model-optimizer/extensions/ops/aten.py | 2 +- .../extensions/ops/embedding_bag.py | 102 ++++++++++---- 6 files changed, 94 insertions(+), 269 deletions(-) delete mode 100644 model-optimizer/extensions/middle/EmbeddingBagResolver.py delete mode 100644 model-optimizer/extensions/middle/EmbeddingBagResolver_test.py diff --git a/model-optimizer/extensions/front/ATenToEmbeddingBag.py b/model-optimizer/extensions/front/ATenToEmbeddingBag.py index 5c0cc434add802..c76cef84161068 100644 --- a/model-optimizer/extensions/front/ATenToEmbeddingBag.py +++ b/model-optimizer/extensions/front/ATenToEmbeddingBag.py @@ -14,7 +14,7 @@ limitations under the License. """ -from extensions.ops.embedding_bag import EmbeddingBag +from extensions.ops.embedding_bag import EmbeddingBagOffsetsSum, EmbeddingBagPackedSum from mo.front.common.replacement import FrontReplacementPattern from mo.graph.graph import Graph, rename_node @@ -27,11 +27,21 @@ class AtenToEmbeddingBag(FrontReplacementPattern): def find_and_replace_pattern(self, graph: Graph): for node in graph.get_op_nodes(op='ATen', operator='embedding_bag'): + assert node.has_valid('mode') and node.mode == 0, 'ATen::embedding_bag has unsupported mode, only "sum" ' \ + 'mode is supported for node {}.'.format(node.id) node_name = node.name rename_node(node, node_name + '/Old') - embedding_bag = EmbeddingBag(graph, {'name': node_name, 'mode': node.mode, - 'scale_grad_by_freq': node.scale_grad_by_freq}).create_node() + indices_shape = node.in_port(1).data.get_shape() + if len(indices_shape) == 2: + embedding_bag = EmbeddingBagPackedSum(graph, {'name': node_name}).create_node() + per_sample_weights_port_id = 2 + else: + embedding_bag = EmbeddingBagOffsetsSum(graph, {'name': node_name}).create_node() + per_sample_weights_port_id = 3 + node.in_port(2).get_connection().set_destination(embedding_bag.in_port(2)) node.in_port(0).get_connection().set_destination(embedding_bag.in_port(0)) node.in_port(1).get_connection().set_destination(embedding_bag.in_port(1)) - node.in_port(2).get_connection().set_destination(embedding_bag.in_port(2)) node.out_port(0).get_connection().set_source(embedding_bag.out_port(0)) + if len(node.in_ports()) == 4 and not node.in_port(3).disconnected(): + node.in_port(3).get_connection().set_destination(embedding_bag.in_port(per_sample_weights_port_id)) + diff --git a/model-optimizer/extensions/front/onnx/aten_ext.py b/model-optimizer/extensions/front/onnx/aten_ext.py index f55b341a16e0a1..502830f406b68a 100644 --- a/model-optimizer/extensions/front/onnx/aten_ext.py +++ b/model-optimizer/extensions/front/onnx/aten_ext.py @@ -26,7 +26,6 @@ class ATenFrontExtractor(FrontExtractorOp): def extract(cls, node): mode = onnx_attr(node, 'mode', 'i', default=1) operator = onnx_attr(node, 'operator', 's').decode() - scale_grad_by_freq = onnx_attr(node, 'scale_grad_by_freq', 'i', default=0) - ATen.update_node_stat(node, {'operator': operator, 'mode': mode, 'scale_grad_by_freq': scale_grad_by_freq}) + ATen.update_node_stat(node, {'operator': operator, 'mode': mode}) return cls.enabled diff --git a/model-optimizer/extensions/middle/EmbeddingBagResolver.py b/model-optimizer/extensions/middle/EmbeddingBagResolver.py deleted file mode 100644 index 3582677ff2a967..00000000000000 --- a/model-optimizer/extensions/middle/EmbeddingBagResolver.py +++ /dev/null @@ -1,111 +0,0 @@ -""" - Copyright (c) 2018-2019 Intel Corporation - - Licensed under the Apache License, Version 2.0 (the "License"); - you may not use this file except in compliance with the License. - You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - - Unless required by applicable law or agreed to in writing, software - distributed under the License is distributed on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - See the License for the specific language governing permissions and - limitations under the License. -""" -import logging as log - -import numpy as np - -from extensions.ops.gather import Gather -from extensions.ops.parameter import Parameter -from extensions.ops.sparse_weighted_sum import ExperimentalSparseWeightedSum -from mo.front.common.partial_infer.utils import int64_array -from mo.front.tf.graph_utils import create_op_with_const_inputs -from mo.graph.graph import Graph -from mo.middle.replacement import MiddleReplacementPattern -from mo.ops.concat import Concat - - -class EmbeddingBagResolver(MiddleReplacementPattern): - ''' - Replace EmbeddingBag with Gather or SparseWeightedSum. - If shape of offsets is equal to shape of indices it means that offsets are obsolete because they have to define - "bags" of shape 1 and we can remove offsets and replace EmbeddingBag with just Gather. In another case offsets must - be used and EmbeddingBag can be replaced by SparseWeightedSum, but offsets must be pre-processed. - ''' - enabled = True - force_clean_up = True - - def find_and_replace_pattern(self, graph: Graph): - weighted_sum_nodes = list() - index_shape = None - merge_offsets = True - - for node in graph.get_op_nodes(op='EmbeddingBag'): - weights_shape = node.in_port(0).data.get_shape() - indices_shape = node.in_port(1).data.get_shape() - offsets_shape = node.in_port(2).data.get_shape() - - assert node.scale_grad_by_freq == 0 - - if indices_shape[0] == offsets_shape[0]: - # The simple case when we can replace EmbeddingBag with just Gather and not use offsets node at all - gather = create_op_with_const_inputs(graph, Gather, {2: int64_array(0)}, - {'name': node.name + '/Emb_Bag/Gather_'}) - - node.in_port(0).get_connection().set_destination(gather.in_port(0)) - node.in_port(1).get_connection().set_destination(gather.in_port(1)) - node.out_port(0).get_connection().set_source(gather.out_port(0)) - else: - assert node.mode == 0 - - dense_shape = int64_array([offsets_shape[0], indices_shape[0]]) - default_index = int64_array(weights_shape[0]) - sweightedsum = create_op_with_const_inputs(graph, ExperimentalSparseWeightedSum, - {2: dense_shape, 4: default_index}, - {'name': node.name + '/WeightedSum'}) - if index_shape is None: - index_shape = indices_shape[-1] - else: - merge_offsets = merge_offsets and index_shape == indices_shape[-1] - weighted_sum_nodes.append((sweightedsum, indices_shape[-1])) - - default_embeddings = np.zeros([1, weights_shape[-1]]) - weights_concat = create_op_with_const_inputs(graph, Concat, {1: default_embeddings}, - {'axis': 0, 'in_ports_count': 2}) - node.in_port(0).get_connection().set_destination(weights_concat.in_port(0)) - node.in_port(1).get_connection().set_destination(sweightedsum.in_port(1)) - weights_concat.out_port(0).connect(sweightedsum.in_port(3)) - - node.out_port(0).get_connection().set_source(sweightedsum.out_port(0)) - self.create_offsets_for_weighted_sum(graph, weighted_sum_nodes, merge_offsets, index_shape) - - def create_offsets_for_weighted_sum(self, graph, weighted_sum_nodes, merge_offsets, index_shape): - new_offsets = None - for i, (node, ind_shape) in enumerate(weighted_sum_nodes): - if merge_offsets and len(weighted_sum_nodes) > 1: - # generate single offsets input if possible - if new_offsets is None: - shape = int64_array([len(weighted_sum_nodes), index_shape, 2]) - new_offsets = Parameter(graph, {'name': 'Emb_Bag/offsets', - 'shape': shape, - 'data_type': np.int32}).create_node() - log.error( - 'Pre-process of offsets is needed for generated input "Emb_Bag/offsets" of shape: {}. ' - 'Refer to the documentation on how to convert the ONNX* DLRM model'.format(shape), - extra={'is_warning': True}) - gather = create_op_with_const_inputs(graph, Gather, {1: int64_array(i), 2: int64_array(0)}, - {'name': node.name + '/Gather_'}) - new_offsets.out_port(0).connect(gather.in_port(0)) - gather.out_port(0).connect(node.in_port(0)) - else: - shape = int64_array([ind_shape, 2]) - new_offsets = Parameter(graph, {'name': 'Emb_Bag/offsets{}'.format(i), - 'shape': shape, - 'data_type': np.int32}).create_node() - new_offsets.out_port(0).connect(node.in_port(0)) - log.error( - 'Pre-process of offsets is needed for generated input "Emb_Bag/offsets{}" of shape: {}. ' - 'Refer to the documentation on how to convert the ONNX* DLRM model'.format(i, shape), - extra={'is_warning': True}) diff --git a/model-optimizer/extensions/middle/EmbeddingBagResolver_test.py b/model-optimizer/extensions/middle/EmbeddingBagResolver_test.py deleted file mode 100644 index c3627d076103d6..00000000000000 --- a/model-optimizer/extensions/middle/EmbeddingBagResolver_test.py +++ /dev/null @@ -1,127 +0,0 @@ -""" - Copyright (C) 2020 Intel Corporation - - Licensed under the Apache License, Version 2.0 (the "License"); - you may not use this file except in compliance with the License. - You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - - Unless required by applicable law or agreed to in writing, software - distributed under the License is distributed on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - See the License for the specific language governing permissions and - limitations under the License. -""" -import unittest - -import numpy as np - -from extensions.middle.EmbeddingBagResolver import EmbeddingBagResolver -from mo.utils.ir_engine.compare_graphs import compare_graphs -from mo.utils.unittest.graph import build_graph - -nodes_attributes = {'node_1': {'value': None, 'kind': 'op', 'op': 'EmbeddingBag', 'scale_grad_by_freq': 0, 'mode': 0}, - 'node_1_data': {'value': None, 'kind': 'data', 'data_type': None}, - 'node_2': {'value': None, 'kind': 'op', 'op': 'EmbeddingBag', 'scale_grad_by_freq': 0, 'mode': 0}, - 'node_2_data': {'value': None, 'kind': 'data', 'data_type': None}, - 'gather_1': {'type': 'Gather', 'value': None, 'kind': 'op'}, - 'gather_1_data': {'value': None, 'kind': 'data', 'data_type': None}, - 'ws_1': {'type': 'ExperimentalSparseWeightedSum', 'value': None, 'kind': 'op'}, - 'ws_1_data': {'value': None, 'kind': 'data', 'data_type': None}, - 'const_axis': {'type': 'Const', 'kind': 'op', 'op': 'Const', 'value': None, 'shape': None}, - 'axis_data': {'value': None, 'kind': 'data', 'data_type': None}, - 'const_default': {'type': 'Const', 'kind': 'op', 'op': 'Const', 'value': None, 'shape': None}, - 'default_data': {'value': None, 'kind': 'data', 'data_type': None}, - 'const_dense_shape': {'type': 'Const', 'kind': 'op', 'op': 'Const', 'value': None, 'shape': None}, - 'dense_shape_data': {'value': None, 'kind': 'data', 'data_type': None}, - 'const': {'type': 'Const', 'kind': 'op', 'op': 'Const', 'value': None, 'shape': None}, - 'const_data': {'value': None, 'kind': 'data', 'data_type': None}, - 'concat': {'type': 'Concat', 'value': None, 'kind': 'op'}, - 'concat_data': {'value': None, 'kind': 'data', 'data_type': None}, - # Placeholders - 'indices': {'shape': None, 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, - 'indices_data': {'value': None, 'shape': None, 'kind': 'data', 'data_type': None}, - 'offsets': {'shape': None, 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, - 'offsets_data': {'value': None, 'shape': None, 'kind': 'data', 'data_type': None}, - 'const_weights': {'type': 'Const', 'kind': 'op', 'op': 'Const', 'value': None, 'shape': None}, - 'weights_data': {'value': None, 'shape': None, 'kind': 'data', 'data_type': None}, - - 'op_output': {'kind': 'op', 'op': 'Result', 'infer': lambda x: None} - } - - -class EmbeddingBagResolverTests(unittest.TestCase): - def test_embedding_bag_to_gather(self): - graph = build_graph(nodes_attributes, - [('const_weights', 'weights_data'), - ('weights_data', 'node_1'), - ('indices', 'indices_data'), - ('indices_data', 'node_1'), - ('offsets', 'offsets_data'), - ('offsets_data', 'node_1'), - ('node_1', 'node_1_data'), - ('node_1_data', 'op_output') - ], - {'indices_data': {'shape': np.array([128])}, - 'offsets_data': {'shape': np.array([128])}}, - nodes_with_edges_only=True) - - graph_ref = build_graph(nodes_attributes, - [('const_weights', 'weights_data'), - ('weights_data', 'gather_1'), - ('indices', 'indices_data'), - ('indices_data', 'gather_1'), - ('const_axis', 'axis_data'), - ('axis_data', 'gather_1'), - ('gather_1', 'gather_1_data'), - ('gather_1_data', 'op_output') - ], - {'indices_data': {'shape': np.array([128])}}, - nodes_with_edges_only=True) - graph.graph['layout'] = 'NCHW' - EmbeddingBagResolver().find_and_replace_pattern(graph) - (flag, resp) = compare_graphs(graph, graph_ref, 'op_output') - self.assertTrue(flag, resp) - - def test_embedding_bag_to_single_weighted_sum(self): - graph = build_graph(nodes_attributes, - [('const_weights', 'weights_data'), - ('weights_data', 'node_1'), - ('indices', 'indices_data'), - ('indices_data', 'node_1'), - ('offsets', 'offsets_data'), - ('offsets_data', 'node_1'), - ('node_1', 'node_1_data'), - ('node_1_data', 'op_output') - ], - {'indices_data': {'shape': np.array([128])}, - 'offsets_data': {'shape': np.array([64])}, - 'weights_data': {'shape': np.array([1024, 16])}}, - nodes_with_edges_only=True) - - graph_ref = build_graph(nodes_attributes, - [('const_weights', 'weights_data'), - ('const', 'const_data'), - ('weights_data', 'concat'), - ('const_data', 'concat'), - ('concat', 'concat_data'), - ('offsets', 'offsets_data'), - ('indices', 'indices_data'), - ('const_default', 'default_data'), - ('const_dense_shape', 'dense_shape_data'), - ('offsets_data', 'ws_1'), - ('indices_data', 'ws_1'), - ('dense_shape_data', 'ws_1'), - ('concat_data', 'ws_1'), - ('default_data', 'ws_1'), - ('ws_1', 'ws_1_data'), - ('ws_1_data', 'op_output') - ], - {'indices_data': {'shape': np.array([128])}, - 'offsets': {'shape': np.array([128, 2])}}, - nodes_with_edges_only=True) - graph.graph['layout'] = 'NCHW' - EmbeddingBagResolver().find_and_replace_pattern(graph) - (flag, resp) = compare_graphs(graph, graph_ref, 'op_output') - self.assertTrue(flag, resp) diff --git a/model-optimizer/extensions/ops/aten.py b/model-optimizer/extensions/ops/aten.py index f1c68f9aec7efd..92a045d2340cc4 100644 --- a/model-optimizer/extensions/ops/aten.py +++ b/model-optimizer/extensions/ops/aten.py @@ -31,4 +31,4 @@ def __init__(self, graph: Graph, attrs: dict): }, attrs) def supported_attrs(self): - return ['mode', 'operator', 'scale_grad_by_freq'] + return ['mode', 'operator'] diff --git a/model-optimizer/extensions/ops/embedding_bag.py b/model-optimizer/extensions/ops/embedding_bag.py index 28d44fa776ffd7..0597b49fe4b2a6 100644 --- a/model-optimizer/extensions/ops/embedding_bag.py +++ b/model-optimizer/extensions/ops/embedding_bag.py @@ -14,53 +14,107 @@ limitations under the License. """ -from mo.front.common.partial_infer.utils import int64_array from mo.graph.graph import Node, Graph from mo.ops.op import Op +import numpy as np -class EmbeddingBag(Op): - ''' - This is nn.EmbeddingBag from Pytorch. It is a simple lookup table that stores embeddings of a fixed dictionary and - size and computes sums or means of "bags" of embeddings, without instantiating the intermediate embeddings. - Inputs: - 0: Weights (num_embeddings, embedding_dim) - the lookup table - 1: Indices (N,) - indices to get from lookup table - 2: Offsets (B,) - index in indices tensor on which each bag starts - Output: - 0: Embeddings (B, embedding_dim) - ''' - op = 'EmbeddingBag' - enabled = False + +class EmbeddingBagOffsetsSum(Op): + op = 'EmbeddingBagOffsetsSum' + enabled = True def __init__(self, graph: Graph, attrs: dict): super().__init__(graph, { 'op': self.op, - 'type': None, + 'type': self.op, 'infer': self.infer, - 'in_ports_count': 3, + 'in_ports_count': 5, 'out_ports_count': 1, }, attrs) - def supported_attrs(self): - return ['mode', 'scale_grad_by_freq'] - @staticmethod def infer(node: Node): name = node.soft_get('name', node.id) connected_in_ports = {idx: port for idx, port in node.in_ports().items() if not port.disconnected()} - assert len(connected_in_ports) == 3 and 0 in connected_in_ports and 1 in connected_in_ports and \ - 2 in connected_in_ports, "EmbeddingBag should have 3 connected input port, but it doesn't for " \ - "node: `{}`. Ports: {}".format(name, connected_in_ports) + assert len(connected_in_ports) >= 3 and 0 in connected_in_ports and 1 in connected_in_ports and \ + 2 in connected_in_ports, "EmbeddingBag should have at least 3 connected input port, but it doesn't " \ + "for node: `{}`. Ports: {}".format(name, connected_in_ports) weights = node.in_port(0).data.get_value() - assert weights is not None and len(weights.shape) == 2 + assert weights is not None and len(weights.shape) >= 2 input_shape = node.in_port(1).data.get_shape() assert input_shape is not None offsets_shape = node.in_port(2).data.get_shape() assert offsets_shape is not None and len(offsets_shape) == 1 - node.out_port(0).data.set_shape(int64_array([offsets_shape[0], weights.shape[1]])) + node.out_port(0).data.set_shape(np.concatenate((input_shape[0], weights.shape[1:]), dtype=np.int64)) + + +class EmbeddingBagPackedSum(Op): + op = 'EmbeddingBagPackedSum' + enabled = True + + def __init__(self, graph: Graph, attrs: dict): + super().__init__(graph, { + 'op': self.op, + 'type': self.op, + + 'infer': self.infer, + + 'in_ports_count': 3, + 'out_ports_count': 1, + }, attrs) + + @staticmethod + def infer(node: Node): + name = node.soft_get('name', node.id) + + connected_in_ports = {idx: port for idx, port in node.in_ports().items() if not port.disconnected()} + assert len(connected_in_ports) >= 2 and 0 in connected_in_ports and 1 in connected_in_ports, \ + "EmbeddingBagPackedSum should have at least 2 connected input port, but it doesn't for node: `{}`. " \ + "Ports: {}".format(name, connected_in_ports) + + weights = node.in_port(0).data.get_value() + assert weights is not None and len(weights.shape) >= 2 + input_shape = node.in_port(1).data.get_shape() + assert input_shape is not None + + node.out_port(0).data.set_shape(np.concatenate((input_shape[0], weights.shape[1:]), dtype=np.int64)) + + +class EmbeddingSegmentsSum(Op): + op = 'EmbeddingSegmentsSum' + enabled = True + + def __init__(self, graph: Graph, attrs: dict): + super().__init__(graph, { + 'op': self.op, + 'type': self.op, + + 'infer': self.infer, + + 'in_ports_count': 6, + 'out_ports_count': 1, + }, attrs) + + @staticmethod + def infer(node: Node): + name = node.soft_get('name', node.id) + + connected_in_ports = {idx: port for idx, port in node.in_ports().items() if not port.disconnected()} + assert len(connected_in_ports) >= 4 and 0 in connected_in_ports and 1 in connected_in_ports and \ + 2 in connected_in_ports and 3 in connected_in_ports, \ + "EmbeddingSegmentsSum should have at least 4 connected input port, but it doesn't for node: `{}`. " \ + "Ports: {}".format(name, connected_in_ports) + + weights = node.in_port(0).data.get_value() + assert weights is not None and len(weights.shape) >= 2 + num_segments = node.in_port(2).data.get_value() + assert num_segments is not None, "EmbeddingSegmentsSum should have a constant num_segments provided, but it " \ + "doesn't for node: `{}`.".format(name) + + node.out_port(0).data.set_shape(np.concatenate((num_segments, weights.shape[1:]), dtype=np.int64)) From bb897c48c827fe0b935d594e75a1d2b451215188 Mon Sep 17 00:00:00 2001 From: Roman Kazantsev Date: Tue, 28 Apr 2020 10:25:42 +0500 Subject: [PATCH 02/31] Transform dynamic sub-graph of Wide and Deep into EmbeddingSegmentsSum - Expressed SparseWeightedSum sub-graph through EmbeddingSegmentsSum - Removed experimental SparseWeightedSum layer - Implemented tests for the transformation Signed-off-by: Roman Kazantsev --- ...ghted_sum.py => embedding_segments_sum.py} | 95 +++++++++++++------ ...test.py => embedding_segments_sum_test.py} | 63 +++++++----- .../extensions/ops/embedding_bag.py | 11 ++- .../extensions/ops/sparse_weighted_sum.py | 57 ----------- .../ops/sparse_weighted_sum_test.py | 67 ------------- 5 files changed, 110 insertions(+), 183 deletions(-) rename model-optimizer/extensions/front/tf/{sparse_weighted_sum.py => embedding_segments_sum.py} (66%) rename model-optimizer/extensions/front/tf/{sparse_weighted_sum_test.py => embedding_segments_sum_test.py} (75%) delete mode 100644 model-optimizer/extensions/ops/sparse_weighted_sum.py delete mode 100644 model-optimizer/extensions/ops/sparse_weighted_sum_test.py diff --git a/model-optimizer/extensions/front/tf/sparse_weighted_sum.py b/model-optimizer/extensions/front/tf/embedding_segments_sum.py similarity index 66% rename from model-optimizer/extensions/front/tf/sparse_weighted_sum.py rename to model-optimizer/extensions/front/tf/embedding_segments_sum.py index 7ea0bb0d28c2cc..88080cd9c08137 100644 --- a/model-optimizer/extensions/front/tf/sparse_weighted_sum.py +++ b/model-optimizer/extensions/front/tf/embedding_segments_sum.py @@ -1,5 +1,5 @@ """ - Copyright (C) 2018-2020 Intel Corporation + Copyright (C) 2020 Intel Corporation Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. @@ -16,12 +16,15 @@ import logging as log -from extensions.ops.sparse_weighted_sum import ExperimentalSparseWeightedSum +from extensions.ops.embedding_bag import EmbeddingSegmentsSum +from extensions.ops.split import Split +from mo.front.common.partial_infer.utils import int64_array from mo.front.common.replacement import FrontReplacementSubgraph -from mo.graph.graph import Graph +from mo.front.tf.graph_utils import create_op_with_const_inputs +from mo.graph.graph import Graph, rename_nodes -class ExperimentalSparseWeightedSumFrontReplacer(FrontReplacementSubgraph): +class EmbeddingSegmentsSumFrontReplacer(FrontReplacementSubgraph): """ The transformation looks for pattern (sub-graph) that performs extraction of embedding vectors from the parameters table for object feature values and sum up these embedding vectors for every object. @@ -30,7 +33,7 @@ class ExperimentalSparseWeightedSumFrontReplacer(FrontReplacementSubgraph): enabled = True def pattern(self): - log.debug('Enabled ExperimentalSparseWeightedSum replacement') + log.debug('Enabled EmbeddingSegmentsSum replacement') return dict( nodes=[ ('identity_spw', dict(op='Identity')), @@ -76,18 +79,31 @@ def replace_sub_graph(self, graph: Graph, match: dict): gather0_2 = match['gather0_2'] greaterequal0 = match['greaterequal0'] sparse_fill_empty_rows = match['sparse_fill_empty_rows'] - where0 = match['where0'] + gather = match['gather'] select = match['select'] - - log.debug('Found ExperimentalSparseWeightedSum2 pattern after {} with name {}'.format(sparse_fill_empty_rows.op, sparse_fill_empty_rows.name)) - - sparse_weighted_sum = ExperimentalSparseWeightedSum(graph, {'name': sparse_fill_empty_rows.name + '/ExperimentalSparseWeightedSum_'}).create_node() - gather0_1.in_port(0).get_connection().set_destination(sparse_weighted_sum.in_port(0)) - greaterequal0.in_port(0).get_connection().set_destination(sparse_weighted_sum.in_port(1)) - identity_spw.in_port(0).get_connection().set_destination(sparse_weighted_sum.in_port(2)) - gather.in_port(0).get_connection().set_destination(sparse_weighted_sum.in_port(3)) - sparse_fill_empty_rows.in_port(3).get_connection().set_destination(sparse_weighted_sum.in_port(4)) + output_node_name = select.soft_get('name', select.id) + log.debug('Found EmbeddingSegmentsSum pattern after {} with name {}'.format(sparse_fill_empty_rows.op, sparse_fill_empty_rows.name)) + + split_for_indices = create_op_with_const_inputs(graph, Split, {1: int64_array(1)}, {'num_splits': 2}) + split_for_dense_shape = create_op_with_const_inputs(graph, Split, {1: int64_array(0)}, {'num_splits': 2}) + abandoned_name = output_node_name + '/AbandonedName' + embedding_segments_sum = EmbeddingSegmentsSum(graph, {'name': abandoned_name}).create_node() + rename_nodes([(select, abandoned_name), (embedding_segments_sum, output_node_name)]) + + # connect parameters table + gather.in_port(0).get_connection().set_destination(embedding_segments_sum.in_port(0)) + # connect indices values + greaterequal0.in_port(0).get_connection().set_destination(embedding_segments_sum.in_port(1)) + # split and connect segment ids + gather0_1.in_port(0).get_connection().set_destination(split_for_indices.in_port(0)) + embedding_segments_sum.in_port(2).connect(split_for_indices.out_port(0)) + # split and connect number of segments + identity_spw.in_port(0).get_connection().set_destination(split_for_dense_shape.in_port(0)) + embedding_segments_sum.in_port(3).connect(split_for_dense_shape.out_port(0)) + # no input port for per_sample_weight + # connect default value + sparse_fill_empty_rows.in_port(3).get_connection().set_destination(embedding_segments_sum.in_port(5)) identity_spw.in_port(0).disconnect() gather0_1.in_port(0).disconnect() @@ -96,11 +112,11 @@ def replace_sub_graph(self, graph: Graph, match: dict): sparse_fill_empty_rows.in_port(2).disconnect() gather.in_port(0).disconnect() - select.out_port(0).get_connection().set_source(sparse_weighted_sum.out_port(0)) - graph.remove_nodes_from([gather0_1.id, gather0_2.id, greaterequal0.id, sparse_fill_empty_rows.id, select.id, where0.id]) + select.out_port(0).get_connection().set_source(embedding_segments_sum.out_port(0)) + graph.remove_nodes_from([gather0_1.id, gather0_2.id, greaterequal0.id, sparse_fill_empty_rows.id, select.id]) -class ExperimentalSparseWeightedSumFrontReplacer2(FrontReplacementSubgraph): +class EmbeddingSegmentsSumFrontReplacer2(FrontReplacementSubgraph): """ The transformation looks for pattern (sub-graph) that performs extraction of embedding vectors from the parameters table for object feature values and sum up these embedding vectors for every object. @@ -109,7 +125,7 @@ class ExperimentalSparseWeightedSumFrontReplacer2(FrontReplacementSubgraph): enabled = True def pattern(self): - log.debug('Enabled ExperimentalSparseWeightedSum2 replacement') + log.debug('Enabled EmbeddingSegmentsSum2 replacement') return dict( nodes=[ ('identity_spw', dict(op='Identity')), @@ -161,16 +177,33 @@ def replace_sub_graph(self, graph: Graph, match: dict): sparse_fill_empty_rows = match['sparse_fill_empty_rows'] gather = match['gather'] select = match['select'] - where0 = match['where0'] - - log.debug('Found ExperimentalSparseWeightedSum2 pattern after {} with name {}'.format(sparse_fill_empty_rows.op, sparse_fill_empty_rows.name)) - - sparse_weighted_sum = ExperimentalSparseWeightedSum(graph, {'name': sparse_fill_empty_rows.name + '/ExperimentalSparseWeightedSum_'}).create_node() - gather0_1.in_port(0).get_connection().set_destination(sparse_weighted_sum.in_port(0)) - greaterequal0.in_port(0).get_connection().set_destination(sparse_weighted_sum.in_port(1)) - identity_spw.in_port(0).get_connection().set_destination(sparse_weighted_sum.in_port(2)) - gather.in_port(0).get_connection().set_destination(sparse_weighted_sum.in_port(3)) - sparse_fill_empty_rows.in_port(3).get_connection().set_destination(sparse_weighted_sum.in_port(4)) + output_node_name = select.soft_get('name', select.id) + + log.debug('Found EmbeddingSegmentsSum2 pattern after {} with name {}'.format(sparse_fill_empty_rows.op, sparse_fill_empty_rows.name)) + + split_for_indices = create_op_with_const_inputs(graph, Split, {1: int64_array(1)}, + {'num_splits': 2, + 'name': output_node_name + '/SplitForIndices'}) + split_for_dense_shape = create_op_with_const_inputs(graph, Split, {1: int64_array(0)}, + {'num_splits': 2, + 'name': output_node_name + '/SplitForDenseShape'}) + abandoned_name = output_node_name + '/AbandonedName' + embedding_segments_sum = EmbeddingSegmentsSum(graph, {'name': abandoned_name}).create_node() + rename_nodes([(select, abandoned_name), (embedding_segments_sum, output_node_name)]) + + # connect parameters table + gather.in_port(0).get_connection().set_destination(embedding_segments_sum.in_port(0)) + # connect indices values + greaterequal0.in_port(0).get_connection().set_destination(embedding_segments_sum.in_port(1)) + # split and connect segment ids + gather0_1.in_port(0).get_connection().set_destination(split_for_indices.in_port(0)) + embedding_segments_sum.in_port(2).connect(split_for_indices.out_port(0)) + # split and connect number of segments + identity_spw.in_port(0).get_connection().set_destination(split_for_dense_shape.in_port(0)) + embedding_segments_sum.in_port(3).connect(split_for_dense_shape.out_port(0)) + # no input port for per_sample_weight + # connect default value + sparse_fill_empty_rows.in_port(3).get_connection().set_destination(embedding_segments_sum.in_port(5)) identity_spw.in_port(0).disconnect() gather0_1.in_port(0).disconnect() @@ -179,5 +212,5 @@ def replace_sub_graph(self, graph: Graph, match: dict): sparse_fill_empty_rows.in_port(2).disconnect() gather.in_port(0).disconnect() - select.out_port(0).get_connection().set_source(sparse_weighted_sum.out_port(0)) - graph.remove_nodes_from([gather0_1.id, gather0_2.id, greaterequal0.id, sparse_fill_empty_rows.id, select.id, where0.id]) + select.out_port(0).get_connection().set_source(embedding_segments_sum.out_port(0)) + graph.remove_nodes_from([gather0_1.id, gather0_2.id, greaterequal0.id, sparse_fill_empty_rows.id, select.id]) diff --git a/model-optimizer/extensions/front/tf/sparse_weighted_sum_test.py b/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py similarity index 75% rename from model-optimizer/extensions/front/tf/sparse_weighted_sum_test.py rename to model-optimizer/extensions/front/tf/embedding_segments_sum_test.py index becbac324f93ca..e958a3041e534e 100644 --- a/model-optimizer/extensions/front/tf/sparse_weighted_sum_test.py +++ b/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py @@ -1,5 +1,5 @@ """ - Copyright (C) 2018-2020 Intel Corporation + Copyright (C) 2020 Intel Corporation Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. @@ -16,14 +16,13 @@ import unittest -from extensions.front.tf.sparse_weighted_sum import ExperimentalSparseWeightedSumFrontReplacer, \ - ExperimentalSparseWeightedSumFrontReplacer2 +from extensions.front.tf.embedding_segments_sum import EmbeddingSegmentsSumFrontReplacer, EmbeddingSegmentsSumFrontReplacer2 from mo.front.common.partial_infer.utils import int64_array from mo.utils.ir_engine.compare_graphs import compare_graphs -from mo.utils.unittest.graph import build_graph +from mo.utils.unittest.graph import build_graph, const -class ExperimentalSparseWeightedSumFrontReplacersTest(unittest.TestCase): +class EmbeddingSegmentsSumFrontReplacerFrontReplacersTest(unittest.TestCase): def test1(self): nodes_attributes = { 'input_indices': {'shape': int64_array([5, 2]), 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, @@ -48,7 +47,12 @@ def test1(self): 'tile': {'kind': 'op', 'op': 'Tile', 'type': 'Tile'}, 'select': {'kind': 'op', 'op': 'Select'}, - 'sparse_weighted_sum': {'kind': 'op', 'op': 'ExperimentalSparseWeightedSum'}, + 'split_for_indices': {'kind': 'op', 'op': 'Split'}, + 'split_for_dense_shape': {'kind': 'op', 'op': 'Split'}, + 'embedding_segments_sum': {'kind': 'op', 'op': 'EmbeddingSegmentsSum'}, + + **const('split_for_indices_axis', int64_array(1)), + **const('split_for_dense_shape_axis', int64_array(0)), 'last': {'type': None, 'value': None, 'kind': 'op', 'op': 'Result'}, } @@ -82,16 +86,20 @@ def test1(self): ('select', 'last', {'out': 0, 'in': 0}), ], nodes_with_edges_only=True) graph.stage = 'front' - ExperimentalSparseWeightedSumFrontReplacer().find_and_replace_pattern(graph) + EmbeddingSegmentsSumFrontReplacer().find_and_replace_pattern(graph) graph_ref = build_graph(nodes_attributes, - [('input_indices', 'sparse_weighted_sum', {'in': 0}), - ('input_values', 'sparse_weighted_sum', {'in': 1}), - ('input_dense_shape', 'sparse_weighted_sum', {'in': 2}), - ('input_params_table', 'sparse_weighted_sum', {'in': 3}), - ('input_default_value', 'sparse_weighted_sum', {'in': 4}), - ('sparse_weighted_sum', 'last', {'in': 0}),], - nodes_with_edges_only=True) + [('input_indices', 'split_for_indices', {'in': 0}), + ('split_for_indices_axis', 'split_for_indices', {'in': 1}), + ('split_for_indices', 'embedding_segments_sum', {'in': 2, 'out': 0}), + ('input_values', 'embedding_segments_sum', {'in': 1}), + ('input_dense_shape', 'split_for_dense_shape', {'in': 0}), + ('split_for_dense_shape_axis', 'split_for_dense_shape', {'in': 1}), + ('split_for_dense_shape', 'embedding_segments_sum', {'in': 3, 'out': 0}), + ('input_params_table', 'embedding_segments_sum', {'in': 0}), + ('input_default_value', 'embedding_segments_sum', {'in': 5}), + ('embedding_segments_sum', 'last', {'in': 0}),], + nodes_with_edges_only=True) (flag, resp) = compare_graphs(graph, graph_ref, 'last', check_op_attrs=True) self.assertTrue(flag, resp) @@ -122,7 +130,12 @@ def test2(self): 'tile': {'kind': 'op', 'op': 'Tile', 'type': 'Tile'}, 'select': {'kind': 'op', 'op': 'Select'}, - 'sparse_weighted_sum': {'kind': 'op', 'op': 'ExperimentalSparseWeightedSum'}, + 'split_for_indices': {'kind': 'op', 'op': 'Split'}, + 'split_for_dense_shape': {'kind': 'op', 'op': 'Split'}, + 'embedding_segments_sum': {'kind': 'op', 'op': 'EmbeddingSegmentsSum'}, + + **const('split_for_indices_axis', int64_array(1)), + **const('split_for_dense_shape_axis', int64_array(0)), 'last': {'type': None, 'value': None, 'kind': 'op', 'op': 'Result'}, } @@ -158,16 +171,20 @@ def test2(self): ('select', 'last', {'out': 0, 'in': 0})], nodes_with_edges_only=True) graph.stage = 'front' - ExperimentalSparseWeightedSumFrontReplacer2().find_and_replace_pattern(graph) + EmbeddingSegmentsSumFrontReplacer2().find_and_replace_pattern(graph) graph_ref = build_graph(nodes_attributes, - [('input_indices', 'sparse_weighted_sum', {'in': 0}), - ('input_values', 'sparse_weighted_sum', {'in': 1}), - ('input_dense_shape', 'sparse_weighted_sum', {'in': 2}), - ('input_params_table', 'sparse_weighted_sum', {'in': 3}), - ('input_default_value', 'sparse_weighted_sum', {'in': 4}), - ('sparse_weighted_sum', 'last', {'in': 0}),], - nodes_with_edges_only=True) + [('input_indices', 'split_for_indices', {'in': 0}), + ('split_for_indices_axis', 'split_for_indices', {'in': 1}), + ('split_for_indices', 'embedding_segments_sum', {'in': 2, 'out': 0}), + ('input_values', 'embedding_segments_sum', {'in': 1}), + ('input_dense_shape', 'split_for_dense_shape', {'in': 0}), + ('split_for_dense_shape_axis', 'split_for_dense_shape', {'in': 1}), + ('split_for_dense_shape', 'embedding_segments_sum', {'in': 3, 'out': 0}), + ('input_params_table', 'embedding_segments_sum', {'in': 0}), + ('input_default_value', 'embedding_segments_sum', {'in': 5}), + ('embedding_segments_sum', 'last', {'in': 0}),], + nodes_with_edges_only=True) (flag, resp) = compare_graphs(graph, graph_ref, 'last', check_op_attrs=True) self.assertTrue(flag, resp) diff --git a/model-optimizer/extensions/ops/embedding_bag.py b/model-optimizer/extensions/ops/embedding_bag.py index 0597b49fe4b2a6..132fe40d003a16 100644 --- a/model-optimizer/extensions/ops/embedding_bag.py +++ b/model-optimizer/extensions/ops/embedding_bag.py @@ -14,6 +14,7 @@ limitations under the License. """ +from mo.front.common.partial_infer.utils import int64_array from mo.graph.graph import Node, Graph from mo.ops.op import Op @@ -111,10 +112,10 @@ def infer(node: Node): "EmbeddingSegmentsSum should have at least 4 connected input port, but it doesn't for node: `{}`. " \ "Ports: {}".format(name, connected_in_ports) - weights = node.in_port(0).data.get_value() - assert weights is not None and len(weights.shape) >= 2 - num_segments = node.in_port(2).data.get_value() + weights_shape = node.in_port(0).data.get_shape() + assert len(weights_shape) >= 2 + num_segments = node.in_port(3).data.get_value() assert num_segments is not None, "EmbeddingSegmentsSum should have a constant num_segments provided, but it " \ "doesn't for node: `{}`.".format(name) - - node.out_port(0).data.set_shape(np.concatenate((num_segments, weights.shape[1:]), dtype=np.int64)) + output_shape = int64_array(num_segments.tolist() + weights_shape[1:].tolist()) + node.out_port(0).data.set_shape(output_shape) diff --git a/model-optimizer/extensions/ops/sparse_weighted_sum.py b/model-optimizer/extensions/ops/sparse_weighted_sum.py deleted file mode 100644 index ff76b211f1c3de..00000000000000 --- a/model-optimizer/extensions/ops/sparse_weighted_sum.py +++ /dev/null @@ -1,57 +0,0 @@ -""" - Copyright (C) 2018-2020 Intel Corporation - - Licensed under the Apache License, Version 2.0 (the "License"); - you may not use this file except in compliance with the License. - You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - - Unless required by applicable law or agreed to in writing, software - distributed under the License is distributed on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - See the License for the specific language governing permissions and - limitations under the License. -""" - -from mo.front.common.partial_infer.utils import int64_array -from mo.graph.graph import Node, Graph -from mo.ops.op import Op - - -class ExperimentalSparseWeightedSum(Op): - op = 'ExperimentalSparseWeightedSum' - enabled = True - - def __init__(self, graph: Graph, attrs: dict): - super().__init__(graph, { - 'type': __class__.op, - 'op': __class__.op, - 'version': 'experimental', - 'reduce_op': None, - 'type_infer': self.type_infer, - 'infer': self.infer, - 'in_ports_count': 6, - 'out_ports_count': 1, - }, attrs) - - def supported_attrs(self): - return [] - - @staticmethod - def type_infer(node): - # the output type must be the same as the parameters table type - params_table_type = node.in_port(3).get_data_type() - node.out_port(0).set_data_type(params_table_type) - - @staticmethod - def infer(node: Node): - assert len(node.in_nodes()) == 5 or len(node.in_nodes()) == 6, \ - "Incorrect number of inputs for {} node".format(node.id) - - batch_size = node.in_port(2).data.get_value()[0] - num_features = node.in_port(3).data.get_shape()[1:] - output_shape = int64_array([batch_size] + num_features.tolist()) - node.out_port(0).data.set_shape(output_shape) - - # TODO: implement output value computation if all input is constant diff --git a/model-optimizer/extensions/ops/sparse_weighted_sum_test.py b/model-optimizer/extensions/ops/sparse_weighted_sum_test.py deleted file mode 100644 index 0f1b40028d5af2..00000000000000 --- a/model-optimizer/extensions/ops/sparse_weighted_sum_test.py +++ /dev/null @@ -1,67 +0,0 @@ -""" - Copyright (C) 2018-2020 Intel Corporation - - Licensed under the Apache License, Version 2.0 (the "License"); - you may not use this file except in compliance with the License. - You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - - Unless required by applicable law or agreed to in writing, software - distributed under the License is distributed on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - See the License for the specific language governing permissions and - limitations under the License. -""" - -import unittest - -import numpy as np - -from extensions.ops.sparse_weighted_sum import ExperimentalSparseWeightedSum -from mo.front.common.partial_infer.utils import int64_array -from mo.graph.graph import Node -from mo.utils.unittest.graph import build_graph - -nodes_attributes = {'input_indices': {'shape': None, 'value': None, 'kind': 'data'}, - 'input_values': {'shape': None, 'value': None, 'kind': 'data'}, - 'input_dense_shape': {'shape': None, 'value': None, 'kind': 'data'}, - 'input_params_table': {'shape': None, 'value': None, 'kind': 'data'}, - 'input_default_value': {'shape': None, 'value': None, 'kind': 'data'}, - 'input_weights': {'shape': None, 'value': None, 'kind': 'data'}, - 'sparse_weighted_sum_node': {'op': 'ExperimentalSparseWeightedSum', 'kind': 'op'}, - 'output': {'shape': None, 'value': None, 'kind': 'data'}} - -# graph 1 -edges1 = [('input_indices', 'sparse_weighted_sum_node', {'in': 0}), - ('input_values', 'sparse_weighted_sum_node', {'in': 1}), - ('input_dense_shape', 'sparse_weighted_sum_node', {'in': 2}), - ('input_params_table', 'sparse_weighted_sum_node', {'in': 3}), - ('input_default_value', 'sparse_weighted_sum_node', {'in': 4}), - ('input_weights', 'sparse_weighted_sum_node', {'in': 5}), - ('sparse_weighted_sum_node', 'output', {'out': 0})] - -inputs1 = {'input_indices': {'shape': int64_array([5, 2]), 'value': None}, - 'input_values': {'shape': int64_array([5]), 'value': None}, - 'input_dense_shape': {'shape': int64_array([2]), 'value': int64_array([4, 3])}, - 'input_params_table': {'shape': int64_array([100, 4, 5]), 'value': None}, - 'input_default_value': {'shape': int64_array([]), 'value': 100.0}, - 'input_weights': {'shape': int64_array([5]), 'value': None}} - - -class TestExperimentalSparseWeightedSum(unittest.TestCase): - def test_partial_infer1(self): - graph = build_graph(nodes_attributes, edges1, inputs1) - sparse_weighted_sum_node = Node(graph, 'sparse_weighted_sum_node') - ExperimentalSparseWeightedSum.infer(sparse_weighted_sum_node) - - # prepare reference results - ref_output_shape = np.array([4, 4, 5], dtype=np.int32) - - # get the result - res_output_shape = graph.node['output']['shape'] - - self.assertTrue(np.array_equal(ref_output_shape, res_output_shape), - 'shapes do not match expected: {} and given: {}'.format(ref_output_shape, res_output_shape)) - - From 3a86aff155b4707daa318349d18eec4cbe0590e9 Mon Sep 17 00:00:00 2001 From: "Maxim, Vafin" Date: Thu, 30 Apr 2020 13:57:40 +0300 Subject: [PATCH 03/31] Fix EmbeddingBag shape infer --- model-optimizer/extensions/ops/embedding_bag.py | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/model-optimizer/extensions/ops/embedding_bag.py b/model-optimizer/extensions/ops/embedding_bag.py index 132fe40d003a16..60467ced8498f3 100644 --- a/model-optimizer/extensions/ops/embedding_bag.py +++ b/model-optimizer/extensions/ops/embedding_bag.py @@ -45,14 +45,14 @@ def infer(node: Node): 2 in connected_in_ports, "EmbeddingBag should have at least 3 connected input port, but it doesn't " \ "for node: `{}`. Ports: {}".format(name, connected_in_ports) - weights = node.in_port(0).data.get_value() - assert weights is not None and len(weights.shape) >= 2 + weights_shape = node.in_port(0).data.get_shape() + assert len(weights_shape) >= 2 input_shape = node.in_port(1).data.get_shape() assert input_shape is not None offsets_shape = node.in_port(2).data.get_shape() assert offsets_shape is not None and len(offsets_shape) == 1 - node.out_port(0).data.set_shape(np.concatenate((input_shape[0], weights.shape[1:]), dtype=np.int64)) + node.out_port(0).data.set_shape(np.concatenate((input_shape[:1], weights_shape[1:]), dtype=np.int64)) class EmbeddingBagPackedSum(Op): @@ -79,12 +79,12 @@ def infer(node: Node): "EmbeddingBagPackedSum should have at least 2 connected input port, but it doesn't for node: `{}`. " \ "Ports: {}".format(name, connected_in_ports) - weights = node.in_port(0).data.get_value() - assert weights is not None and len(weights.shape) >= 2 + weights_shape = node.in_port(0).data.get_shape() + assert len(weights_shape) >= 2 input_shape = node.in_port(1).data.get_shape() assert input_shape is not None - node.out_port(0).data.set_shape(np.concatenate((input_shape[0], weights.shape[1:]), dtype=np.int64)) + node.out_port(0).data.set_shape(np.concatenate((input_shape[:1], weights_shape[1:]), dtype=np.int64)) class EmbeddingSegmentsSum(Op): From 40295be3c6bb6f41d80c7ddf8587820d6a7c9c65 Mon Sep 17 00:00:00 2001 From: Roman Kazantsev Date: Thu, 7 May 2020 18:06:25 +0500 Subject: [PATCH 04/31] Fix EmbeddingSegmentsSum transformation for Wide and Deep Signed-off-by: Roman Kazantsev --- .../front/tf/embedding_segments_sum.py | 19 +++++++++------- .../front/tf/embedding_segments_sum_test.py | 12 ++++++++-- .../extensions/middle/sparse_reshape.py | 22 ++++++++++++++----- .../extensions/ops/embedding_bag.py | 2 +- 4 files changed, 38 insertions(+), 17 deletions(-) diff --git a/model-optimizer/extensions/front/tf/embedding_segments_sum.py b/model-optimizer/extensions/front/tf/embedding_segments_sum.py index 88080cd9c08137..1c135849d1948f 100644 --- a/model-optimizer/extensions/front/tf/embedding_segments_sum.py +++ b/model-optimizer/extensions/front/tf/embedding_segments_sum.py @@ -22,6 +22,7 @@ from mo.front.common.replacement import FrontReplacementSubgraph from mo.front.tf.graph_utils import create_op_with_const_inputs from mo.graph.graph import Graph, rename_nodes +from mo.ops.squeeze import Squeeze class EmbeddingSegmentsSumFrontReplacer(FrontReplacementSubgraph): @@ -87,9 +88,9 @@ def replace_sub_graph(self, graph: Graph, match: dict): split_for_indices = create_op_with_const_inputs(graph, Split, {1: int64_array(1)}, {'num_splits': 2}) split_for_dense_shape = create_op_with_const_inputs(graph, Split, {1: int64_array(0)}, {'num_splits': 2}) - abandoned_name = output_node_name + '/AbandonedName' - embedding_segments_sum = EmbeddingSegmentsSum(graph, {'name': abandoned_name}).create_node() - rename_nodes([(select, abandoned_name), (embedding_segments_sum, output_node_name)]) + squeeze_to_scalar = create_op_with_const_inputs(graph, Squeeze, {1: int64_array([0])}) + embedding_segments_sum = EmbeddingSegmentsSum(graph, {'name': output_node_name}).create_node() + rename_nodes([(select, output_node_name + '/AbandonedName'), (embedding_segments_sum, output_node_name)]) # connect parameters table gather.in_port(0).get_connection().set_destination(embedding_segments_sum.in_port(0)) @@ -100,7 +101,8 @@ def replace_sub_graph(self, graph: Graph, match: dict): embedding_segments_sum.in_port(2).connect(split_for_indices.out_port(0)) # split and connect number of segments identity_spw.in_port(0).get_connection().set_destination(split_for_dense_shape.in_port(0)) - embedding_segments_sum.in_port(3).connect(split_for_dense_shape.out_port(0)) + squeeze_to_scalar.in_port(0).connect(split_for_dense_shape.out_port(0)) + embedding_segments_sum.in_port(3).connect(squeeze_to_scalar.out_port(0)) # no input port for per_sample_weight # connect default value sparse_fill_empty_rows.in_port(3).get_connection().set_destination(embedding_segments_sum.in_port(5)) @@ -187,9 +189,9 @@ def replace_sub_graph(self, graph: Graph, match: dict): split_for_dense_shape = create_op_with_const_inputs(graph, Split, {1: int64_array(0)}, {'num_splits': 2, 'name': output_node_name + '/SplitForDenseShape'}) - abandoned_name = output_node_name + '/AbandonedName' - embedding_segments_sum = EmbeddingSegmentsSum(graph, {'name': abandoned_name}).create_node() - rename_nodes([(select, abandoned_name), (embedding_segments_sum, output_node_name)]) + squeeze_to_scalar = create_op_with_const_inputs(graph, Squeeze, {1: int64_array([0])}) + embedding_segments_sum = EmbeddingSegmentsSum(graph, {'name': output_node_name}).create_node() + rename_nodes([(select, output_node_name + '/AbandonedName'), (embedding_segments_sum, output_node_name)]) # connect parameters table gather.in_port(0).get_connection().set_destination(embedding_segments_sum.in_port(0)) @@ -200,7 +202,8 @@ def replace_sub_graph(self, graph: Graph, match: dict): embedding_segments_sum.in_port(2).connect(split_for_indices.out_port(0)) # split and connect number of segments identity_spw.in_port(0).get_connection().set_destination(split_for_dense_shape.in_port(0)) - embedding_segments_sum.in_port(3).connect(split_for_dense_shape.out_port(0)) + squeeze_to_scalar.in_port(0).connect(split_for_dense_shape.out_port(0)) + embedding_segments_sum.in_port(3).connect(squeeze_to_scalar.out_port(0)) # no input port for per_sample_weight # connect default value sparse_fill_empty_rows.in_port(3).get_connection().set_destination(embedding_segments_sum.in_port(5)) diff --git a/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py b/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py index e958a3041e534e..de9af2af604c73 100644 --- a/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py +++ b/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py @@ -49,10 +49,12 @@ def test1(self): 'split_for_indices': {'kind': 'op', 'op': 'Split'}, 'split_for_dense_shape': {'kind': 'op', 'op': 'Split'}, + 'squeeze_to_scalar': {'kind': 'op', 'op': 'Squeeze'}, 'embedding_segments_sum': {'kind': 'op', 'op': 'EmbeddingSegmentsSum'}, **const('split_for_indices_axis', int64_array(1)), **const('split_for_dense_shape_axis', int64_array(0)), + **const('squeeze_axis', int64_array([0])), 'last': {'type': None, 'value': None, 'kind': 'op', 'op': 'Result'}, } @@ -95,7 +97,9 @@ def test1(self): ('input_values', 'embedding_segments_sum', {'in': 1}), ('input_dense_shape', 'split_for_dense_shape', {'in': 0}), ('split_for_dense_shape_axis', 'split_for_dense_shape', {'in': 1}), - ('split_for_dense_shape', 'embedding_segments_sum', {'in': 3, 'out': 0}), + ('split_for_dense_shape', 'squeeze_to_scalar', {'in': 0}), + ('squeeze_axis', 'squeeze_to_scalar', {'in': 1}), + ('squeeze_to_scalar', 'embedding_segments_sum', {'in': 3, 'out': 0}), ('input_params_table', 'embedding_segments_sum', {'in': 0}), ('input_default_value', 'embedding_segments_sum', {'in': 5}), ('embedding_segments_sum', 'last', {'in': 0}),], @@ -132,10 +136,12 @@ def test2(self): 'split_for_indices': {'kind': 'op', 'op': 'Split'}, 'split_for_dense_shape': {'kind': 'op', 'op': 'Split'}, + 'squeeze_to_scalar': {'kind': 'op', 'op': 'Squeeze'}, 'embedding_segments_sum': {'kind': 'op', 'op': 'EmbeddingSegmentsSum'}, **const('split_for_indices_axis', int64_array(1)), **const('split_for_dense_shape_axis', int64_array(0)), + **const('squeeze_axis', int64_array([0])), 'last': {'type': None, 'value': None, 'kind': 'op', 'op': 'Result'}, } @@ -180,7 +186,9 @@ def test2(self): ('input_values', 'embedding_segments_sum', {'in': 1}), ('input_dense_shape', 'split_for_dense_shape', {'in': 0}), ('split_for_dense_shape_axis', 'split_for_dense_shape', {'in': 1}), - ('split_for_dense_shape', 'embedding_segments_sum', {'in': 3, 'out': 0}), + ('split_for_dense_shape', 'squeeze_to_scalar', {'in': 0}), + ('squeeze_axis', 'squeeze_to_scalar', {'in': 1}), + ('squeeze_to_scalar', 'embedding_segments_sum', {'in': 3, 'out': 0}), ('input_params_table', 'embedding_segments_sum', {'in': 0}), ('input_default_value', 'embedding_segments_sum', {'in': 5}), ('embedding_segments_sum', 'last', {'in': 0}),], diff --git a/model-optimizer/extensions/middle/sparse_reshape.py b/model-optimizer/extensions/middle/sparse_reshape.py index eeaa381555398a..f4670e3992c6a1 100644 --- a/model-optimizer/extensions/middle/sparse_reshape.py +++ b/model-optimizer/extensions/middle/sparse_reshape.py @@ -46,6 +46,14 @@ def replace_pattern(self, graph: Graph, match: dict): input_shape_value = sparse_reshape.in_port(1).data.get_value() output_shape_value = sparse_reshape.out_port(1).data.get_value() + # establish output shape if value of new shape is given as input + new_shape_value = sparse_reshape.in_port(2).data.get_value() + if output_shape_value is None and new_shape_value is not None: + output_shape_value = new_shape_value + if np.count_nonzero(output_shape_value == -1) == 1: + elem = np.prod(input_shape_value) // np.prod(new_shape_value[new_shape_value != -1]) + output_shape_value[output_shape_value == -1] = elem + if input_shape_value is None or output_shape_value is None: raise Error("Input shape and output shape values must be defined for node {}".format(sparse_reshape.id)) if not np.array_equal(input_shape_value, output_shape_value): @@ -53,14 +61,16 @@ def replace_pattern(self, graph: Graph, match: dict): input_data_node1 = sparse_reshape.in_node(0) input_data_node2 = sparse_reshape.in_node(1) - output_data_node1 = sparse_reshape.out_node(0) - output_data_node2 = sparse_reshape.out_node(1) graph.remove_edge(input_data_node1.id, sparse_reshape.id) - graph.remove_edge(sparse_reshape.id, output_data_node1.id) graph.remove_edge(input_data_node2.id, sparse_reshape.id) - graph.remove_edge(sparse_reshape.id, output_data_node2.id) - merge_data_nodes(graph, output_data_node1, input_data_node1) - merge_data_nodes(graph, output_data_node2, input_data_node2) + if 0 in sparse_reshape.out_nodes(): + output_data_node1 = sparse_reshape.out_node(0) + graph.remove_edge(sparse_reshape.id, output_data_node1.id) + merge_data_nodes(graph, output_data_node1, input_data_node1) + if 1 in sparse_reshape.out_nodes(): + output_data_node2 = sparse_reshape.out_node(1) + graph.remove_edge(sparse_reshape.id, output_data_node2.id) + merge_data_nodes(graph, output_data_node2, input_data_node2) graph.remove_nodes_from([sparse_reshape.id, input_data_node1.id, input_data_node2.id]) # TODO: investigate why this second way does not work diff --git a/model-optimizer/extensions/ops/embedding_bag.py b/model-optimizer/extensions/ops/embedding_bag.py index 60467ced8498f3..b08235932d014c 100644 --- a/model-optimizer/extensions/ops/embedding_bag.py +++ b/model-optimizer/extensions/ops/embedding_bag.py @@ -117,5 +117,5 @@ def infer(node: Node): num_segments = node.in_port(3).data.get_value() assert num_segments is not None, "EmbeddingSegmentsSum should have a constant num_segments provided, but it " \ "doesn't for node: `{}`.".format(name) - output_shape = int64_array(num_segments.tolist() + weights_shape[1:].tolist()) + output_shape = int64_array([num_segments] + weights_shape[1:].tolist()) node.out_port(0).data.set_shape(output_shape) From 725a1bb549646d273d39593bfae04ea2488c33d1 Mon Sep 17 00:00:00 2001 From: Roman Kazantsev Date: Wed, 13 May 2020 17:13:17 +0500 Subject: [PATCH 05/31] Fix EmbeddingSegmentSum replacer after ports swap Signed-off-by: Roman Kazantsev --- .../extensions/front/tf/embedding_segments_sum.py | 10 +++++----- .../extensions/front/tf/embedding_segments_sum_test.py | 4 ++-- 2 files changed, 7 insertions(+), 7 deletions(-) diff --git a/model-optimizer/extensions/front/tf/embedding_segments_sum.py b/model-optimizer/extensions/front/tf/embedding_segments_sum.py index 1c135849d1948f..2e0d4c0e851a1f 100644 --- a/model-optimizer/extensions/front/tf/embedding_segments_sum.py +++ b/model-optimizer/extensions/front/tf/embedding_segments_sum.py @@ -103,9 +103,9 @@ def replace_sub_graph(self, graph: Graph, match: dict): identity_spw.in_port(0).get_connection().set_destination(split_for_dense_shape.in_port(0)) squeeze_to_scalar.in_port(0).connect(split_for_dense_shape.out_port(0)) embedding_segments_sum.in_port(3).connect(squeeze_to_scalar.out_port(0)) - # no input port for per_sample_weight # connect default value - sparse_fill_empty_rows.in_port(3).get_connection().set_destination(embedding_segments_sum.in_port(5)) + sparse_fill_empty_rows.in_port(3).get_connection().set_destination(embedding_segments_sum.in_port(4)) + # no input port for per_sample_weight identity_spw.in_port(0).disconnect() gather0_1.in_port(0).disconnect() @@ -203,10 +203,10 @@ def replace_sub_graph(self, graph: Graph, match: dict): # split and connect number of segments identity_spw.in_port(0).get_connection().set_destination(split_for_dense_shape.in_port(0)) squeeze_to_scalar.in_port(0).connect(split_for_dense_shape.out_port(0)) - embedding_segments_sum.in_port(3).connect(squeeze_to_scalar.out_port(0)) - # no input port for per_sample_weight + embedding_segments_sum.in_port(3).connect(squeeze_to_scalar.out_port(0)) # connect default value - sparse_fill_empty_rows.in_port(3).get_connection().set_destination(embedding_segments_sum.in_port(5)) + sparse_fill_empty_rows.in_port(3).get_connection().set_destination(embedding_segments_sum.in_port(4)) + # no input port for per_sample_weight identity_spw.in_port(0).disconnect() gather0_1.in_port(0).disconnect() diff --git a/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py b/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py index de9af2af604c73..7e8aff025cf256 100644 --- a/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py +++ b/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py @@ -101,7 +101,7 @@ def test1(self): ('squeeze_axis', 'squeeze_to_scalar', {'in': 1}), ('squeeze_to_scalar', 'embedding_segments_sum', {'in': 3, 'out': 0}), ('input_params_table', 'embedding_segments_sum', {'in': 0}), - ('input_default_value', 'embedding_segments_sum', {'in': 5}), + ('input_default_value', 'embedding_segments_sum', {'in': 4}), ('embedding_segments_sum', 'last', {'in': 0}),], nodes_with_edges_only=True) @@ -190,7 +190,7 @@ def test2(self): ('squeeze_axis', 'squeeze_to_scalar', {'in': 1}), ('squeeze_to_scalar', 'embedding_segments_sum', {'in': 3, 'out': 0}), ('input_params_table', 'embedding_segments_sum', {'in': 0}), - ('input_default_value', 'embedding_segments_sum', {'in': 5}), + ('input_default_value', 'embedding_segments_sum', {'in': 4}), ('embedding_segments_sum', 'last', {'in': 0}),], nodes_with_edges_only=True) From f4bcd887adbb55c3c65670336d2587e87cd6dc35 Mon Sep 17 00:00:00 2001 From: Roman Kazantsev Date: Wed, 13 May 2020 17:20:01 +0500 Subject: [PATCH 06/31] Update package_BOM.txt Signed-off-by: Roman Kazantsev --- model-optimizer/automation/package_BOM.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/model-optimizer/automation/package_BOM.txt b/model-optimizer/automation/package_BOM.txt index 2d19e07fbcb815..1c7015e4083c8b 100644 --- a/model-optimizer/automation/package_BOM.txt +++ b/model-optimizer/automation/package_BOM.txt @@ -362,6 +362,7 @@ extensions/front/tf/cumsum_ext.py extensions/front/tf/deconv_ext.py extensions/front/tf/depth_to_space.py extensions/front/tf/elementwise_ext.py +extensions/front/tf/embedding_segments_sum.py extensions/front/tf/expand_dims_ext.py extensions/front/tf/extract_image_patches_ext.py extensions/front/tf/fake_const_ext.py @@ -435,7 +436,6 @@ extensions/front/tf/sparse_segment_mean_ext.py extensions/front/tf/sparse_segment_sqrtn_ext.py extensions/front/tf/sparse_segment_sum_ext.py extensions/front/tf/sparse_to_dense_ext.py -extensions/front/tf/sparse_weighted_sum.py extensions/front/tf/split_ext.py extensions/front/tf/ssd_support.json extensions/front/tf/ssd_support_api_v1.14.json From 05b1fafbc28b4805e4752b7e35397326f99a961e Mon Sep 17 00:00:00 2001 From: "Maxim, Vafin" Date: Fri, 15 May 2020 13:58:37 +0300 Subject: [PATCH 07/31] Add unit tests for EmbeddingXXX shape infer --- .../extensions/ops/embedding_bag.py | 6 +- .../extensions/ops/embedding_bag_test.py | 89 +++++++++++++++++++ 2 files changed, 92 insertions(+), 3 deletions(-) create mode 100644 model-optimizer/extensions/ops/embedding_bag_test.py diff --git a/model-optimizer/extensions/ops/embedding_bag.py b/model-optimizer/extensions/ops/embedding_bag.py index b08235932d014c..28441e974efcf2 100644 --- a/model-optimizer/extensions/ops/embedding_bag.py +++ b/model-optimizer/extensions/ops/embedding_bag.py @@ -52,7 +52,7 @@ def infer(node: Node): offsets_shape = node.in_port(2).data.get_shape() assert offsets_shape is not None and len(offsets_shape) == 1 - node.out_port(0).data.set_shape(np.concatenate((input_shape[:1], weights_shape[1:]), dtype=np.int64)) + node.out_port(0).data.set_shape(np.concatenate((offsets_shape[:1], weights_shape[1:])).astype(np.int64)) class EmbeddingBagPackedSum(Op): @@ -84,7 +84,7 @@ def infer(node: Node): input_shape = node.in_port(1).data.get_shape() assert input_shape is not None - node.out_port(0).data.set_shape(np.concatenate((input_shape[:1], weights_shape[1:]), dtype=np.int64)) + node.out_port(0).data.set_shape(np.concatenate((input_shape[:1], weights_shape[1:])).astype(np.int64)) class EmbeddingSegmentsSum(Op): @@ -117,5 +117,5 @@ def infer(node: Node): num_segments = node.in_port(3).data.get_value() assert num_segments is not None, "EmbeddingSegmentsSum should have a constant num_segments provided, but it " \ "doesn't for node: `{}`.".format(name) - output_shape = int64_array([num_segments] + weights_shape[1:].tolist()) + output_shape = np.concatenate(([num_segments], weights_shape[1:])).astype(np.int64) node.out_port(0).data.set_shape(output_shape) diff --git a/model-optimizer/extensions/ops/embedding_bag_test.py b/model-optimizer/extensions/ops/embedding_bag_test.py new file mode 100644 index 00000000000000..4c59a0cbe3bd64 --- /dev/null +++ b/model-optimizer/extensions/ops/embedding_bag_test.py @@ -0,0 +1,89 @@ +""" + Copyright (C) 2018-2020 Intel Corporation + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +""" + +import unittest + +import numpy as np + +from extensions.ops.embedding_bag import EmbeddingBagOffsetsSum, EmbeddingBagPackedSum, EmbeddingSegmentsSum +from mo.front.common.partial_infer.utils import int64_array +from mo.graph.graph import Node +from mo.utils.unittest.graph import build_graph, regular_op_with_shaped_data, valued_const_with_data, result, \ + connect, FakeAttr + +nodes = { + **valued_const_with_data('data', np.random.randn(3000, 8)), + **regular_op_with_shaped_data('indices1d', [100], {'type': 'Parameter', 'value': None, + '_out_port_data_type': {0: np.int32}}), + **regular_op_with_shaped_data('indices2d', [30, 3], {'type': 'Parameter', 'value': None, + '_out_port_data_type': {0: np.int32}}), + **regular_op_with_shaped_data('offsets', [30], {'type': 'Parameter', 'value': None, + '_out_port_data_type': {0: np.int32}}), + **regular_op_with_shaped_data('segment_ids', [100], {'type': 'Parameter', 'value': None, + '_out_port_data_type': {0: np.int32}}), + **valued_const_with_data('num_segments', np.array(30, dtype=np.int32)), + **regular_op_with_shaped_data('embedding_bag_offsets', None, + {'op': 'EmbeddingBagOffsetsSum', 'type': 'EmbeddingBagOffsetsSum', + 'name': 'embedding_bag_offsets'}), + **regular_op_with_shaped_data('embedding_bag_packed', None, + {'op': 'EmbeddingBagPackedSum', 'type': 'EmbeddingBagPackedSum', + 'name': 'embedding_bag_packed'}), + **regular_op_with_shaped_data('embedding_segments', None, + {'op': 'EmbeddingSegmentsSum', 'type': 'EmbeddingSegmentsSum', + 'name': 'embedding_bag_packed'}), + **result('output'), +} + + +class TestEmbeddingXXXInfer(unittest.TestCase): + def test_embedding_bag_offsets_sum(self): + graph = build_graph(nodes, [ + *connect('data', '0:embedding_bag_offsets'), + *connect('indices', '1:embedding_bag_offsets'), + *connect('offsets', '2:embedding_bag_offsets'), + ('embedding_bag_offsets', 'embedding_bag_offsets_d', {'out': 0}), + ('embedding_bag_offsets_d', 'output'), + ], nodes_with_edges_only=True) + eb_node = Node(graph, 'embedding_bag') + EmbeddingBagOffsetsSum.infer(eb_node) + + self.assertTrue(np.array_equal(eb_node.out_port(0).data.get_shape(), int64_array([30, 8]))) + + def test_embedding_bag_offsets_sum(self): + graph = build_graph(nodes, [ + *connect('data', '0:embedding_bag_packed'), + *connect('indices2d', '1:embedding_bag_packed'), + ('embedding_bag_packed', 'embedding_bag_packed_d', {'out': 0}), + ('embedding_bag_packed_d', 'output'), + ], nodes_with_edges_only=True) + eb_node = Node(graph, 'embedding_bag_packed') + EmbeddingBagPackedSum.infer(eb_node) + + self.assertTrue(np.array_equal(eb_node.out_port(0).data.get_shape(), int64_array([30, 8]))) + + def test_embedding_segments_sum(self): + graph = build_graph(nodes, [ + *connect('data', '0:embedding_segments'), + *connect('indices1d', '1:embedding_segments'), + *connect('segment_ids', '2:embedding_segments'), + *connect('num_segments', '3:embedding_segments'), + ('embedding_segments', 'embedding_segments_d', {'out': 0}), + ('embedding_segments_d', 'output'), + ], nodes_with_edges_only=True) + eb_node = Node(graph, 'embedding_segments') + EmbeddingSegmentsSum.infer(eb_node) + + self.assertTrue(np.array_equal(eb_node.out_port(0).data.get_shape(), int64_array([30, 8]))) From 973e9b547688ea91a0abca2e6588cf3bc6f77fbb Mon Sep 17 00:00:00 2001 From: "Maxim, Vafin" Date: Fri, 15 May 2020 14:27:23 +0300 Subject: [PATCH 08/31] Fix ATen resolver --- model-optimizer/extensions/front/ATenToEmbeddingBag.py | 3 +-- .../extensions/front/ATenToEmbeddingBag_test.py | 10 ++++------ 2 files changed, 5 insertions(+), 8 deletions(-) diff --git a/model-optimizer/extensions/front/ATenToEmbeddingBag.py b/model-optimizer/extensions/front/ATenToEmbeddingBag.py index c76cef84161068..26a6e43cfb8533 100644 --- a/model-optimizer/extensions/front/ATenToEmbeddingBag.py +++ b/model-optimizer/extensions/front/ATenToEmbeddingBag.py @@ -31,8 +31,7 @@ def find_and_replace_pattern(self, graph: Graph): 'mode is supported for node {}.'.format(node.id) node_name = node.name rename_node(node, node_name + '/Old') - indices_shape = node.in_port(1).data.get_shape() - if len(indices_shape) == 2: + if node.in_port(2).disconnected(): embedding_bag = EmbeddingBagPackedSum(graph, {'name': node_name}).create_node() per_sample_weights_port_id = 2 else: diff --git a/model-optimizer/extensions/front/ATenToEmbeddingBag_test.py b/model-optimizer/extensions/front/ATenToEmbeddingBag_test.py index 3873eee29f3f07..fc36fc7190f914 100644 --- a/model-optimizer/extensions/front/ATenToEmbeddingBag_test.py +++ b/model-optimizer/extensions/front/ATenToEmbeddingBag_test.py @@ -24,12 +24,11 @@ 'weights_inp': {'shape': None, 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, 'indices_inp': {'shape': None, 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, 'offsets_inp': {'shape': None, 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, - 'aten': {'type': None, 'kind': 'op', 'op': 'ATen', 'mode': 0, 'operator': 'embedding_bag', 'name': 'my_aten', - 'scale_grad_by_freq': 0}, + 'aten': {'type': None, 'kind': 'op', 'op': 'ATen', 'mode': 0, 'operator': 'embedding_bag', 'name': 'my_aten'}, 'result': {'type': 'Result', 'value': None, 'kind': 'op', 'op': 'Result'}, # new EmbeddingBag layer - 'emb_bag': {'type': None, 'kind': 'op', 'op': 'EmbeddingBag', 'mode': 0, 'scale_grad_by_freq': 0}, + 'emb_bag': {'type': 'EmbeddingBagOffsetsSum', 'kind': 'op', 'op': 'EmbeddingBagOffsetsSum'}, } @@ -54,9 +53,8 @@ def test(self): graph.graph['layout'] = 'NCHW' graph.stage = 'front' - replacer = AtenToEmbeddingBag() - replacer.find_and_replace_pattern(graph) + AtenToEmbeddingBag().find_and_replace_pattern(graph) (flag, resp) = compare_graphs(graph, graph_ref, 'result', check_op_attrs=True) self.assertTrue(flag, resp) - self.assertTrue(graph.node[graph.get_nodes_with_attributes(op='EmbeddingBag')[0]]['name'] == 'my_aten') + self.assertTrue(graph.node[graph.get_nodes_with_attributes(op='EmbeddingBagOffsetsSum')[0]]['name'] == 'my_aten') From 4bf92b25f010b5aefdbccf8d1bb13bf83e4fa576 Mon Sep 17 00:00:00 2001 From: "Maxim, Vafin" Date: Tue, 19 May 2020 22:16:50 +0300 Subject: [PATCH 09/31] Remove deleted files from BOM --- model-optimizer/automation/package_BOM.txt | 2 -- 1 file changed, 2 deletions(-) diff --git a/model-optimizer/automation/package_BOM.txt b/model-optimizer/automation/package_BOM.txt index 1c7015e4083c8b..8104d2f2e3c4d0 100644 --- a/model-optimizer/automation/package_BOM.txt +++ b/model-optimizer/automation/package_BOM.txt @@ -516,7 +516,6 @@ extensions/middle/DilatedConvolution.py extensions/middle/EltwiseChecker.py extensions/middle/EltwiseInputNormalization.py extensions/middle/EltwiseInputReshape.py -extensions/middle/EmbeddingBagResolver.py extensions/middle/FakeSplitOutputs.py extensions/middle/FusedBatchNormNonConstant.py extensions/middle/FusedBatchNormTraining.py @@ -680,7 +679,6 @@ extensions/ops/sparse_segment_mean.py extensions/ops/sparse_segment_sqrtn.py extensions/ops/sparse_segment_sum.py extensions/ops/sparse_to_dense.py -extensions/ops/sparse_weighted_sum.py extensions/ops/spatial_transformer.py extensions/ops/splice.py extensions/ops/split.py From 75b5ec421eb227cd53051c95c0c2cc6a012197db Mon Sep 17 00:00:00 2001 From: "Maxim, Vafin" Date: Wed, 20 May 2020 14:50:45 +0300 Subject: [PATCH 10/31] Add opset version to embedding_bag --- model-optimizer/extensions/front/ATenToEmbeddingBag.py | 5 ++--- model-optimizer/extensions/ops/embedding_bag.py | 4 +++- 2 files changed, 5 insertions(+), 4 deletions(-) diff --git a/model-optimizer/extensions/front/ATenToEmbeddingBag.py b/model-optimizer/extensions/front/ATenToEmbeddingBag.py index 26a6e43cfb8533..865001deb4b13f 100644 --- a/model-optimizer/extensions/front/ATenToEmbeddingBag.py +++ b/model-optimizer/extensions/front/ATenToEmbeddingBag.py @@ -27,8 +27,8 @@ class AtenToEmbeddingBag(FrontReplacementPattern): def find_and_replace_pattern(self, graph: Graph): for node in graph.get_op_nodes(op='ATen', operator='embedding_bag'): - assert node.has_valid('mode') and node.mode == 0, 'ATen::embedding_bag has unsupported mode, only "sum" ' \ - 'mode is supported for node {}.'.format(node.id) + assert node.soft_get('mode') == 0, 'ATen::embedding_bag has unsupported mode, only "sum" ' \ + 'mode is supported for node {}.'.format(node.id) node_name = node.name rename_node(node, node_name + '/Old') if node.in_port(2).disconnected(): @@ -43,4 +43,3 @@ def find_and_replace_pattern(self, graph: Graph): node.out_port(0).get_connection().set_source(embedding_bag.out_port(0)) if len(node.in_ports()) == 4 and not node.in_port(3).disconnected(): node.in_port(3).get_connection().set_destination(embedding_bag.in_port(per_sample_weights_port_id)) - diff --git a/model-optimizer/extensions/ops/embedding_bag.py b/model-optimizer/extensions/ops/embedding_bag.py index 28441e974efcf2..667e384f1b5073 100644 --- a/model-optimizer/extensions/ops/embedding_bag.py +++ b/model-optimizer/extensions/ops/embedding_bag.py @@ -14,7 +14,6 @@ limitations under the License. """ -from mo.front.common.partial_infer.utils import int64_array from mo.graph.graph import Node, Graph from mo.ops.op import Op @@ -29,6 +28,7 @@ def __init__(self, graph: Graph, attrs: dict): super().__init__(graph, { 'op': self.op, 'type': self.op, + 'version': 'opset3', 'infer': self.infer, @@ -63,6 +63,7 @@ def __init__(self, graph: Graph, attrs: dict): super().__init__(graph, { 'op': self.op, 'type': self.op, + 'version': 'opset3', 'infer': self.infer, @@ -95,6 +96,7 @@ def __init__(self, graph: Graph, attrs: dict): super().__init__(graph, { 'op': self.op, 'type': self.op, + 'version': 'opset3', 'infer': self.infer, From e9cf0fab135fe4f91c3187a7596ddf59aae0cd12 Mon Sep 17 00:00:00 2001 From: "Maxim, Vafin" Date: Wed, 20 May 2020 15:27:12 +0300 Subject: [PATCH 11/31] Use base class for EmbeddingBag --- .../extensions/ops/embedding_bag.py | 63 ++++++++----------- 1 file changed, 27 insertions(+), 36 deletions(-) diff --git a/model-optimizer/extensions/ops/embedding_bag.py b/model-optimizer/extensions/ops/embedding_bag.py index 667e384f1b5073..e5602c32054601 100644 --- a/model-optimizer/extensions/ops/embedding_bag.py +++ b/model-optimizer/extensions/ops/embedding_bag.py @@ -20,22 +20,35 @@ import numpy as np -class EmbeddingBagOffsetsSum(Op): - op = 'EmbeddingBagOffsetsSum' - enabled = True +class EmbeddingBagBase(Op): + enabled = False + + op = op_type = None + version = None + in_ports_count = None def __init__(self, graph: Graph, attrs: dict): super().__init__(graph, { 'op': self.op, - 'type': self.op, - 'version': 'opset3', + 'type': self.op_type, + 'version': self.version, 'infer': self.infer, - 'in_ports_count': 5, + 'in_ports_count': self.in_ports_count, 'out_ports_count': 1, }, attrs) + @staticmethod + def infer(node: Node): + raise NotImplementedError('Please use specialized EmbeddingBag operation class, EmbeddingBagBase is base class') + + +class EmbeddingBagOffsetsSum(EmbeddingBagBase): + op = op_type = 'EmbeddingBagOffsetsSum' + version = 'opset3' + in_ports_count = 5 + @staticmethod def infer(node: Node): name = node.soft_get('name', node.id) @@ -55,21 +68,10 @@ def infer(node: Node): node.out_port(0).data.set_shape(np.concatenate((offsets_shape[:1], weights_shape[1:])).astype(np.int64)) -class EmbeddingBagPackedSum(Op): - op = 'EmbeddingBagPackedSum' - enabled = True - - def __init__(self, graph: Graph, attrs: dict): - super().__init__(graph, { - 'op': self.op, - 'type': self.op, - 'version': 'opset3', - - 'infer': self.infer, - - 'in_ports_count': 3, - 'out_ports_count': 1, - }, attrs) +class EmbeddingBagPackedSum(EmbeddingBagBase): + op = op_type = 'EmbeddingBagPackedSum' + version = 'opset3' + in_ports_count = 3 @staticmethod def infer(node: Node): @@ -88,21 +90,10 @@ def infer(node: Node): node.out_port(0).data.set_shape(np.concatenate((input_shape[:1], weights_shape[1:])).astype(np.int64)) -class EmbeddingSegmentsSum(Op): - op = 'EmbeddingSegmentsSum' - enabled = True - - def __init__(self, graph: Graph, attrs: dict): - super().__init__(graph, { - 'op': self.op, - 'type': self.op, - 'version': 'opset3', - - 'infer': self.infer, - - 'in_ports_count': 6, - 'out_ports_count': 1, - }, attrs) +class EmbeddingSegmentsSum(EmbeddingBagBase): + op = op_type = 'EmbeddingSegmentsSum' + version = 'opset3' + in_ports_count = 6 @staticmethod def infer(node: Node): From adab635f6f1d73e1d23dac7148334846b0415297 Mon Sep 17 00:00:00 2001 From: "Maxim, Vafin" Date: Thu, 21 May 2020 14:46:59 +0300 Subject: [PATCH 12/31] Fix per_sample_weights case --- model-optimizer/automation/package_BOM.txt | 2 +- .../front/ATenToEmbeddingBag_test.py | 60 ------- .../{front => middle}/ATenToEmbeddingBag.py | 38 ++++- .../middle/ATenToEmbeddingBag_test.py | 146 ++++++++++++++++++ 4 files changed, 178 insertions(+), 68 deletions(-) delete mode 100644 model-optimizer/extensions/front/ATenToEmbeddingBag_test.py rename model-optimizer/extensions/{front => middle}/ATenToEmbeddingBag.py (51%) create mode 100644 model-optimizer/extensions/middle/ATenToEmbeddingBag_test.py diff --git a/model-optimizer/automation/package_BOM.txt b/model-optimizer/automation/package_BOM.txt index 8104d2f2e3c4d0..523bae4bcd3b86 100644 --- a/model-optimizer/automation/package_BOM.txt +++ b/model-optimizer/automation/package_BOM.txt @@ -73,7 +73,6 @@ extensions/back/TransposeToPermute.py extensions/back/UselessConcatRemoval.py extensions/front/__init__.py extensions/front/ArgMaxSqueeze.py -extensions/front/ATenToEmbeddingBag.py extensions/front/AttributedClampNormalizer.py extensions/front/AttributedGatherNormalizer.py extensions/front/AttributedPadToPad.py @@ -493,6 +492,7 @@ extensions/middle/AnchorToPriorBox.py extensions/middle/ApplyNHWCtoNCHWpermutation.py extensions/middle/ApplyPermutations.py extensions/middle/ArgMaxToTopK.py +extensions/middle/ATenToEmbeddingBag.py extensions/middle/AttributedTileNormalizer.py extensions/middle/BiasAddBroadcasting.py extensions/middle/BinarizeWeightsM1P1.py diff --git a/model-optimizer/extensions/front/ATenToEmbeddingBag_test.py b/model-optimizer/extensions/front/ATenToEmbeddingBag_test.py deleted file mode 100644 index fc36fc7190f914..00000000000000 --- a/model-optimizer/extensions/front/ATenToEmbeddingBag_test.py +++ /dev/null @@ -1,60 +0,0 @@ -""" - Copyright (C) 2020 Intel Corporation - - Licensed under the Apache License, Version 2.0 (the "License"); - you may not use this file except in compliance with the License. - You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - - Unless required by applicable law or agreed to in writing, software - distributed under the License is distributed on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - See the License for the specific language governing permissions and - limitations under the License. -""" - -import unittest - -from extensions.front.ATenToEmbeddingBag import AtenToEmbeddingBag -from mo.utils.ir_engine.compare_graphs import compare_graphs -from mo.utils.unittest.graph import build_graph - -nodes_attributes = { - 'weights_inp': {'shape': None, 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, - 'indices_inp': {'shape': None, 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, - 'offsets_inp': {'shape': None, 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, - 'aten': {'type': None, 'kind': 'op', 'op': 'ATen', 'mode': 0, 'operator': 'embedding_bag', 'name': 'my_aten'}, - 'result': {'type': 'Result', 'value': None, 'kind': 'op', 'op': 'Result'}, - - # new EmbeddingBag layer - 'emb_bag': {'type': 'EmbeddingBagOffsetsSum', 'kind': 'op', 'op': 'EmbeddingBagOffsetsSum'}, -} - - -class AtenToEmbeddingBagTest(unittest.TestCase): - def test(self): - graph = build_graph(nodes_attributes, - [('weights_inp', 'aten', {'in': 0, 'out': 0}), - ('indices_inp', 'aten', {'in': 1, 'out': 0}), - ('offsets_inp', 'aten', {'in': 2, 'out': 0}), - ('aten', 'result', {'in': 0, 'out': 0}), - ], - {}, nodes_with_edges_only=True) - - graph_ref = build_graph(nodes_attributes, - [('weights_inp', 'emb_bag', {'in': 0, 'out': 0}), - ('indices_inp', 'emb_bag', {'in': 1, 'out': 0}), - ('offsets_inp', 'emb_bag', {'in': 2, 'out': 0}), - ('emb_bag', 'result', {'in': 0, 'out': 0}), - ], - {}, nodes_with_edges_only=True) - - graph.graph['layout'] = 'NCHW' - graph.stage = 'front' - - AtenToEmbeddingBag().find_and_replace_pattern(graph) - - (flag, resp) = compare_graphs(graph, graph_ref, 'result', check_op_attrs=True) - self.assertTrue(flag, resp) - self.assertTrue(graph.node[graph.get_nodes_with_attributes(op='EmbeddingBagOffsetsSum')[0]]['name'] == 'my_aten') diff --git a/model-optimizer/extensions/front/ATenToEmbeddingBag.py b/model-optimizer/extensions/middle/ATenToEmbeddingBag.py similarity index 51% rename from model-optimizer/extensions/front/ATenToEmbeddingBag.py rename to model-optimizer/extensions/middle/ATenToEmbeddingBag.py index 865001deb4b13f..a5ec75479090b1 100644 --- a/model-optimizer/extensions/front/ATenToEmbeddingBag.py +++ b/model-optimizer/extensions/middle/ATenToEmbeddingBag.py @@ -14,12 +14,18 @@ limitations under the License. """ +import numpy as np + from extensions.ops.embedding_bag import EmbeddingBagOffsetsSum, EmbeddingBagPackedSum -from mo.front.common.replacement import FrontReplacementPattern +from mo.front.common.partial_infer.utils import int64_array +from mo.front.tf.graph_utils import create_op_with_const_inputs from mo.graph.graph import Graph, rename_node +from mo.middle.replacement import MiddleReplacementPattern +from mo.ops.concat import Concat +from mo.ops.const import Const -class AtenToEmbeddingBag(FrontReplacementPattern): +class AtenToEmbeddingBag(MiddleReplacementPattern): """ Converts the ATen layer to EmbeddingBag layer. """ @@ -30,16 +36,34 @@ def find_and_replace_pattern(self, graph: Graph): assert node.soft_get('mode') == 0, 'ATen::embedding_bag has unsupported mode, only "sum" ' \ 'mode is supported for node {}.'.format(node.id) node_name = node.name - rename_node(node, node_name + '/Old') - if node.in_port(2).disconnected(): + rename_node(node, node_name + '/TBR') + is_packed = False + if len(node.in_ports()) < 3 or node.in_port(2).disconnected(): + is_packed = True embedding_bag = EmbeddingBagPackedSum(graph, {'name': node_name}).create_node() - per_sample_weights_port_id = 2 else: embedding_bag = EmbeddingBagOffsetsSum(graph, {'name': node_name}).create_node() - per_sample_weights_port_id = 3 node.in_port(2).get_connection().set_destination(embedding_bag.in_port(2)) + rename_node(embedding_bag, node_name) node.in_port(0).get_connection().set_destination(embedding_bag.in_port(0)) node.in_port(1).get_connection().set_destination(embedding_bag.in_port(1)) node.out_port(0).get_connection().set_source(embedding_bag.out_port(0)) if len(node.in_ports()) == 4 and not node.in_port(3).disconnected(): - node.in_port(3).get_connection().set_destination(embedding_bag.in_port(per_sample_weights_port_id)) + if is_packed: + node.in_port(3).get_connection().set_destination(embedding_bag.in_port(2)) + else: + # connect per_sample_weights + node.in_port(3).get_connection().set_destination(embedding_bag.in_port(4)) + + weights_shape = embedding_bag.in_port(0).data.get_shape() + + # expand embedding table with zeros + default_embeddings = np.zeros([1, weights_shape[-1]]) + weights_concat = create_op_with_const_inputs(graph, Concat, {1: default_embeddings}, + {'axis': 0, 'in_ports_count': 2}) + embedding_bag.in_port(0).get_connection().set_destination(weights_concat.in_port(0)) + weights_concat.out_port(0).connect(embedding_bag.in_port(0)) + + # point default index to expanded part of embedding table + default_index = Const(graph, {'value': int64_array(weights_shape[0])}).create_node() + default_index.out_port(0).connect(embedding_bag.in_port(3)) diff --git a/model-optimizer/extensions/middle/ATenToEmbeddingBag_test.py b/model-optimizer/extensions/middle/ATenToEmbeddingBag_test.py new file mode 100644 index 00000000000000..e7e2cab6485906 --- /dev/null +++ b/model-optimizer/extensions/middle/ATenToEmbeddingBag_test.py @@ -0,0 +1,146 @@ +""" + Copyright (C) 2020 Intel Corporation + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +""" + +import unittest + +import numpy as np + +from extensions.middle.ATenToEmbeddingBag import AtenToEmbeddingBag +from mo.front.common.partial_infer.utils import int64_array +from mo.utils.ir_engine.compare_graphs import compare_graphs +from mo.utils.unittest.graph import build_graph, const, regular_op_with_shaped_data, valued_const_with_data, result, \ + connect + +nodes_attributes = { + **const('weights_inp', np.random.randn(1000, 10)), + 'indices_inp': {'shape': None, 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, + 'offsets_inp': {'shape': None, 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, + **const('per_sample_weights', np.random.randn(20)), + 'aten': {'type': None, 'kind': 'op', 'op': 'ATen', 'mode': 0, 'operator': 'embedding_bag', 'name': 'my_aten'}, + 'result': {'type': 'Result', 'value': None, 'kind': 'op', 'op': 'Result'}, + + # new EmbeddingBag layer + 'emb_bag': {'type': 'EmbeddingBagOffsetsSum', 'kind': 'op', 'op': 'EmbeddingBagOffsetsSum'}, +} + + +class AtenToEmbeddingBagTest(unittest.TestCase): + def test(self): + nodes = { + **valued_const_with_data('weights_inp', np.random.randn(100, 2)), + **regular_op_with_shaped_data('indices_inp', [20], {'type': 'Parameter'}), + **regular_op_with_shaped_data('offsets_inp', [10], {'type': 'Parameter'}), + **regular_op_with_shaped_data('aten', [10, 2], + {'type': None, 'kind': 'op', 'op': 'ATen', 'mode': 0, + 'operator': 'embedding_bag', 'name': 'my_aten'}), + + **regular_op_with_shaped_data('emb_bag', [10, 2], {'type': 'EmbeddingBagOffsetsSum', 'kind': 'op', + 'op': 'EmbeddingBagOffsetsSum'}), + **result('result'), + } + edges = [*connect('weights_inp', '0:aten'), + *connect('indices_inp', '1:aten'), + *connect('offsets_inp', '2:aten'), + *connect('aten', 'result'), + ] + graph = build_graph(nodes, edges) + + edges_ref = [*connect('weights_inp', '0:emb_bag'), + *connect('indices_inp', '1:emb_bag'), + *connect('offsets_inp', '2:emb_bag'), + *connect('emb_bag', 'result'), + ] + + graph_ref = build_graph(nodes, edges_ref) + + AtenToEmbeddingBag().find_and_replace_pattern(graph) + + (flag, resp) = compare_graphs(graph, graph_ref, 'result') + self.assertTrue(flag, resp) + + + def test_packed(self): + nodes = { + **valued_const_with_data('weights_inp', np.random.randn(100, 4)), + **regular_op_with_shaped_data('indices_inp', [10, 2], {'type': 'Parameter'}), + **regular_op_with_shaped_data('aten', [10, 4], + {'type': None, 'kind': 'op', 'op': 'ATen', 'mode': 0, + 'operator': 'embedding_bag', 'name': 'my_aten'}), + + **regular_op_with_shaped_data('emb_bag', [10, 4], {'type': 'EmbeddingBagPackedSum', 'kind': 'op', + 'op': 'EmbeddingBagPackedSum'}), + **result('result'), + } + edges = [*connect('weights_inp', '0:aten'), + *connect('indices_inp', '1:aten'), + *connect('aten', 'result'), + ] + graph = build_graph(nodes, edges) + + edges_ref = [*connect('weights_inp', '0:emb_bag'), + *connect('indices_inp', '1:emb_bag'), + *connect('emb_bag', 'result'), + ] + + graph_ref = build_graph(nodes, edges_ref) + + AtenToEmbeddingBag().find_and_replace_pattern(graph) + + (flag, resp) = compare_graphs(graph, graph_ref, 'result') + self.assertTrue(flag, resp) + + def test_per_sample_weights(self): + nodes = { + **valued_const_with_data('weights_inp', np.random.randn(100, 2)), + **regular_op_with_shaped_data('indices_inp', [20], {'type': 'Parameter'}), + **regular_op_with_shaped_data('offsets_inp', [10], {'type': 'Parameter'}), + **regular_op_with_shaped_data('per_sample_weights', [20], {'type': 'Parameter'}), + **regular_op_with_shaped_data('aten', [10, 2], + {'type': None, 'kind': 'op', 'op': 'ATen', 'mode': 0, + 'operator': 'embedding_bag', 'name': 'my_aten'}), + + **regular_op_with_shaped_data('emb_bag', [10, 2], {'type': 'EmbeddingBagOffsetsSum', 'kind': 'op', + 'op': 'EmbeddingBagOffsetsSum'}), + **valued_const_with_data('zeros', np.zeros([1, 2])), + **regular_op_with_shaped_data('concat', None, {'type': 'Concat', 'kind': 'op', 'op': 'Concat'}), + 'def_index': {'kind': 'op', 'value': int64_array(100), 'shape': None, 'type': 'Const'}, + 'def_index_d': {'kind': 'data', 'value': None, 'shape': None}, + **result('result'), + } + edges = [*connect('weights_inp', '0:aten'), + *connect('indices_inp', '1:aten'), + *connect('offsets_inp', '2:aten'), + *connect('per_sample_weights', '3:aten'), + *connect('aten', 'result'), + ] + graph = build_graph(nodes, edges) + + edges_ref = [*connect('weights_inp', '0:concat'), + *connect('zeros', '1:concat'), + *connect('concat', '0:emb_bag'), + *connect('indices_inp', '1:emb_bag'), + *connect('offsets_inp', '2:emb_bag'), + *connect('def_index', '3:emb_bag'), + *connect('per_sample_weights', '4:emb_bag'), + *connect('emb_bag', 'result'), + ] + + graph_ref = build_graph(nodes, edges_ref) + + AtenToEmbeddingBag().find_and_replace_pattern(graph) + + (flag, resp) = compare_graphs(graph, graph_ref, 'result') + self.assertTrue(flag, resp) From af14345efc6096611d2f5eb60ea55ab4901d1e45 Mon Sep 17 00:00:00 2001 From: Roman Kazantsev Date: Thu, 21 May 2020 23:39:22 +0500 Subject: [PATCH 13/31] Fix EmbeddingSegmentsSum transformation Signed-off-by: Roman Kazantsev --- .../extensions/front/tf/embedding_segments_sum.py | 8 ++++++-- .../front/tf/embedding_segments_sum_test.py | 12 ++++++++++-- 2 files changed, 16 insertions(+), 4 deletions(-) diff --git a/model-optimizer/extensions/front/tf/embedding_segments_sum.py b/model-optimizer/extensions/front/tf/embedding_segments_sum.py index 2e0d4c0e851a1f..ad96ab714fced4 100644 --- a/model-optimizer/extensions/front/tf/embedding_segments_sum.py +++ b/model-optimizer/extensions/front/tf/embedding_segments_sum.py @@ -87,6 +87,7 @@ def replace_sub_graph(self, graph: Graph, match: dict): log.debug('Found EmbeddingSegmentsSum pattern after {} with name {}'.format(sparse_fill_empty_rows.op, sparse_fill_empty_rows.name)) split_for_indices = create_op_with_const_inputs(graph, Split, {1: int64_array(1)}, {'num_splits': 2}) + squeeze_for_indices = create_op_with_const_inputs(graph, Squeeze, {1: int64_array([1])}) split_for_dense_shape = create_op_with_const_inputs(graph, Split, {1: int64_array(0)}, {'num_splits': 2}) squeeze_to_scalar = create_op_with_const_inputs(graph, Squeeze, {1: int64_array([0])}) embedding_segments_sum = EmbeddingSegmentsSum(graph, {'name': output_node_name}).create_node() @@ -98,7 +99,8 @@ def replace_sub_graph(self, graph: Graph, match: dict): greaterequal0.in_port(0).get_connection().set_destination(embedding_segments_sum.in_port(1)) # split and connect segment ids gather0_1.in_port(0).get_connection().set_destination(split_for_indices.in_port(0)) - embedding_segments_sum.in_port(2).connect(split_for_indices.out_port(0)) + squeeze_for_indices.in_port(0).connect(split_for_indices.out_port(0)) + embedding_segments_sum.in_port(2).connect(squeeze_for_indices.out_port(0)) # split and connect number of segments identity_spw.in_port(0).get_connection().set_destination(split_for_dense_shape.in_port(0)) squeeze_to_scalar.in_port(0).connect(split_for_dense_shape.out_port(0)) @@ -186,6 +188,7 @@ def replace_sub_graph(self, graph: Graph, match: dict): split_for_indices = create_op_with_const_inputs(graph, Split, {1: int64_array(1)}, {'num_splits': 2, 'name': output_node_name + '/SplitForIndices'}) + squeeze_for_indices = create_op_with_const_inputs(graph, Squeeze, {1: int64_array([1])}) split_for_dense_shape = create_op_with_const_inputs(graph, Split, {1: int64_array(0)}, {'num_splits': 2, 'name': output_node_name + '/SplitForDenseShape'}) @@ -199,7 +202,8 @@ def replace_sub_graph(self, graph: Graph, match: dict): greaterequal0.in_port(0).get_connection().set_destination(embedding_segments_sum.in_port(1)) # split and connect segment ids gather0_1.in_port(0).get_connection().set_destination(split_for_indices.in_port(0)) - embedding_segments_sum.in_port(2).connect(split_for_indices.out_port(0)) + squeeze_for_indices.in_port(0).connect(split_for_indices.out_port(0)) + embedding_segments_sum.in_port(2).connect(squeeze_for_indices.out_port(0)) # split and connect number of segments identity_spw.in_port(0).get_connection().set_destination(split_for_dense_shape.in_port(0)) squeeze_to_scalar.in_port(0).connect(split_for_dense_shape.out_port(0)) diff --git a/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py b/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py index 7e8aff025cf256..d4944489b73d16 100644 --- a/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py +++ b/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py @@ -48,6 +48,7 @@ def test1(self): 'select': {'kind': 'op', 'op': 'Select'}, 'split_for_indices': {'kind': 'op', 'op': 'Split'}, + 'squeeze_for_indices': {'kind': 'op', 'op': 'Squeeze'}, 'split_for_dense_shape': {'kind': 'op', 'op': 'Split'}, 'squeeze_to_scalar': {'kind': 'op', 'op': 'Squeeze'}, 'embedding_segments_sum': {'kind': 'op', 'op': 'EmbeddingSegmentsSum'}, @@ -55,6 +56,7 @@ def test1(self): **const('split_for_indices_axis', int64_array(1)), **const('split_for_dense_shape_axis', int64_array(0)), **const('squeeze_axis', int64_array([0])), + **const('squeeze_for_indices_axis', int64_array([1])), 'last': {'type': None, 'value': None, 'kind': 'op', 'op': 'Result'}, } @@ -93,7 +95,9 @@ def test1(self): graph_ref = build_graph(nodes_attributes, [('input_indices', 'split_for_indices', {'in': 0}), ('split_for_indices_axis', 'split_for_indices', {'in': 1}), - ('split_for_indices', 'embedding_segments_sum', {'in': 2, 'out': 0}), + ('split_for_indices', 'squeeze_for_indices', {'in': 0}), + ('squeeze_for_indices_axis', 'squeeze_for_indices', {'in': 1}), + ('squeeze_for_indices', 'embedding_segments_sum', {'in': 2, 'out': 0}), ('input_values', 'embedding_segments_sum', {'in': 1}), ('input_dense_shape', 'split_for_dense_shape', {'in': 0}), ('split_for_dense_shape_axis', 'split_for_dense_shape', {'in': 1}), @@ -135,6 +139,7 @@ def test2(self): 'select': {'kind': 'op', 'op': 'Select'}, 'split_for_indices': {'kind': 'op', 'op': 'Split'}, + 'squeeze_for_indices': {'kind': 'op', 'op': 'Squeeze'}, 'split_for_dense_shape': {'kind': 'op', 'op': 'Split'}, 'squeeze_to_scalar': {'kind': 'op', 'op': 'Squeeze'}, 'embedding_segments_sum': {'kind': 'op', 'op': 'EmbeddingSegmentsSum'}, @@ -142,6 +147,7 @@ def test2(self): **const('split_for_indices_axis', int64_array(1)), **const('split_for_dense_shape_axis', int64_array(0)), **const('squeeze_axis', int64_array([0])), + **const('squeeze_for_indices_axis', int64_array([1])), 'last': {'type': None, 'value': None, 'kind': 'op', 'op': 'Result'}, } @@ -182,7 +188,9 @@ def test2(self): graph_ref = build_graph(nodes_attributes, [('input_indices', 'split_for_indices', {'in': 0}), ('split_for_indices_axis', 'split_for_indices', {'in': 1}), - ('split_for_indices', 'embedding_segments_sum', {'in': 2, 'out': 0}), + ('split_for_indices', 'squeeze_for_indices', {'in': 0}), + ('squeeze_for_indices_axis', 'squeeze_for_indices', {'in': 1}), + ('squeeze_for_indices', 'embedding_segments_sum', {'in': 2, 'out': 0}), ('input_values', 'embedding_segments_sum', {'in': 1}), ('input_dense_shape', 'split_for_dense_shape', {'in': 0}), ('split_for_dense_shape_axis', 'split_for_dense_shape', {'in': 1}), From 0f202f99cd850583a0a66e82e5111a08959f4f88 Mon Sep 17 00:00:00 2001 From: "Maxim, Vafin" Date: Fri, 22 May 2020 11:34:43 +0300 Subject: [PATCH 14/31] Fix EmbeddingBag checks --- model-optimizer/extensions/ops/embedding_bag.py | 3 +++ model-optimizer/extensions/ops/embedding_bag_test.py | 2 +- 2 files changed, 4 insertions(+), 1 deletion(-) diff --git a/model-optimizer/extensions/ops/embedding_bag.py b/model-optimizer/extensions/ops/embedding_bag.py index e5602c32054601..1a33feb5b0d401 100644 --- a/model-optimizer/extensions/ops/embedding_bag.py +++ b/model-optimizer/extensions/ops/embedding_bag.py @@ -107,6 +107,9 @@ def infer(node: Node): weights_shape = node.in_port(0).data.get_shape() assert len(weights_shape) >= 2 + indices_shape = node.in_port(1).data.get_shape() + segment_ids = node.in_port(2).data.get_shape() + assert len(indices_shape) == 1 and len(segment_ids) == 1 and indices_shape == segment_ids num_segments = node.in_port(3).data.get_value() assert num_segments is not None, "EmbeddingSegmentsSum should have a constant num_segments provided, but it " \ "doesn't for node: `{}`.".format(name) diff --git a/model-optimizer/extensions/ops/embedding_bag_test.py b/model-optimizer/extensions/ops/embedding_bag_test.py index 4c59a0cbe3bd64..012dd7a1fd6709 100644 --- a/model-optimizer/extensions/ops/embedding_bag_test.py +++ b/model-optimizer/extensions/ops/embedding_bag_test.py @@ -48,7 +48,7 @@ } -class TestEmbeddingXXXInfer(unittest.TestCase): +class TestEmbeddingInfer(unittest.TestCase): def test_embedding_bag_offsets_sum(self): graph = build_graph(nodes, [ *connect('data', '0:embedding_bag_offsets'), From f71fc271c44106c2ceba970c2de5f70fc6d592c1 Mon Sep 17 00:00:00 2001 From: "Maxim, Vafin" Date: Mon, 25 May 2020 13:03:51 +0300 Subject: [PATCH 15/31] Fix ATen front transformation and merge conflicts --- .../extensions/front/ATenToEmbeddingBag.py | 40 ++++++ .../front/ATenToEmbeddingBag_test.py | 61 ++++++++ .../extensions/front/tf/WhereDecomposition.py | 4 +- .../front/tf/embedding_segments_sum.py | 6 +- .../extensions/middle/EmbeddingBagResolver.py | 69 +++++++++ .../middle/EmbeddingBagResolver_test.py | 133 ++++++++++++++++++ .../extensions/middle/sparse_reshape.py | 10 +- .../extensions/ops/embedding_bag.py | 24 +++- 8 files changed, 336 insertions(+), 11 deletions(-) create mode 100644 model-optimizer/extensions/front/ATenToEmbeddingBag.py create mode 100644 model-optimizer/extensions/front/ATenToEmbeddingBag_test.py create mode 100644 model-optimizer/extensions/middle/EmbeddingBagResolver.py create mode 100644 model-optimizer/extensions/middle/EmbeddingBagResolver_test.py diff --git a/model-optimizer/extensions/front/ATenToEmbeddingBag.py b/model-optimizer/extensions/front/ATenToEmbeddingBag.py new file mode 100644 index 00000000000000..769dc669ac6b04 --- /dev/null +++ b/model-optimizer/extensions/front/ATenToEmbeddingBag.py @@ -0,0 +1,40 @@ +""" + Copyright (C) 2018-2020 Intel Corporation + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +""" + +from extensions.ops.embedding_bag import ATenEmbeddingBag +from mo.front.common.replacement import FrontReplacementPattern +from mo.graph.graph import Graph, rename_node + + +class AtenToEmbeddingBag(FrontReplacementPattern): + """ + Converts the ATen layer to EmbeddingBag layer. + """ + enabled = True + + def find_and_replace_pattern(self, graph: Graph): + for node in graph.get_op_nodes(op='ATen', operator='embedding_bag'): + node_name = node.name + rename_node(node, node_name + '/TBR') + embedding_bag = ATenEmbeddingBag(graph, {'name': node_name, 'mode': node.soft_get('mode', 1)}).create_node() + rename_node(embedding_bag, node_name) + node.in_port(0).get_connection().set_destination(embedding_bag.in_port(0)) + node.in_port(1).get_connection().set_destination(embedding_bag.in_port(1)) + if node.has_port('in', 2) and not node.in_port(2).disconnected(): + node.in_port(2).get_connection().set_destination(embedding_bag.in_port(2)) + if node.has_port('in', 3) and not node.in_port(3).disconnected(): + node.in_port(2).get_connection().set_destination(embedding_bag.in_port(3)) + node.out_port(0).get_connection().set_source(embedding_bag.out_port(0)) diff --git a/model-optimizer/extensions/front/ATenToEmbeddingBag_test.py b/model-optimizer/extensions/front/ATenToEmbeddingBag_test.py new file mode 100644 index 00000000000000..9783c7cd08cb35 --- /dev/null +++ b/model-optimizer/extensions/front/ATenToEmbeddingBag_test.py @@ -0,0 +1,61 @@ +""" + Copyright (C) 2020 Intel Corporation + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +""" + +import unittest + +from extensions.front.ATenToEmbeddingBag import AtenToEmbeddingBag +from mo.utils.ir_engine.compare_graphs import compare_graphs +from mo.utils.unittest.graph import build_graph + +nodes_attributes = { + 'weights_inp': {'shape': None, 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, + 'indices_inp': {'shape': None, 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, + 'offsets_inp': {'shape': None, 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, + 'aten': {'type': None, 'kind': 'op', 'op': 'ATen', 'mode': 0, 'operator': 'embedding_bag', 'name': 'my_aten'}, + 'result': {'type': 'Result', 'value': None, 'kind': 'op', 'op': 'Result'}, + + # new EmbeddingBag layer + 'emb_bag': {'type': None, 'kind': 'op', 'op': 'ATenEmbeddingBag', 'mode': 0}, +} + + +class AtenToEmbeddingBagTest(unittest.TestCase): + def test(self): + graph = build_graph(nodes_attributes, + [('weights_inp', 'aten', {'in': 0, 'out': 0}), + ('indices_inp', 'aten', {'in': 1, 'out': 0}), + ('offsets_inp', 'aten', {'in': 2, 'out': 0}), + ('aten', 'result', {'in': 0, 'out': 0}), + ], + {}, nodes_with_edges_only=True) + + graph_ref = build_graph(nodes_attributes, + [('weights_inp', 'emb_bag', {'in': 0, 'out': 0}), + ('indices_inp', 'emb_bag', {'in': 1, 'out': 0}), + ('offsets_inp', 'emb_bag', {'in': 2, 'out': 0}), + ('emb_bag', 'result', {'in': 0, 'out': 0}), + ], + {}, nodes_with_edges_only=True) + + graph.graph['layout'] = 'NCHW' + graph.stage = 'front' + + replacer = AtenToEmbeddingBag() + replacer.find_and_replace_pattern(graph) + + (flag, resp) = compare_graphs(graph, graph_ref, 'result', check_op_attrs=True) + self.assertTrue(flag, resp) + self.assertTrue(graph.node[graph.get_nodes_with_attributes(op='ATenEmbeddingBag')[0]]['name'] == 'my_aten') diff --git a/model-optimizer/extensions/front/tf/WhereDecomposition.py b/model-optimizer/extensions/front/tf/WhereDecomposition.py index 656c015b0cf386..64c56a85ff2bd4 100644 --- a/model-optimizer/extensions/front/tf/WhereDecomposition.py +++ b/model-optimizer/extensions/front/tf/WhereDecomposition.py @@ -33,9 +33,9 @@ class WhereDecomposition(FrontReplacementOp): enabled = True def run_after(self): - from extensions.front.tf.sparse_weighted_sum import ExperimentalSparseWeightedSumFrontReplacer + from extensions.front.tf.embedding_segments_sum import EmbeddingSegmentsSumFrontReplacer from extensions.front.TransposeOrderNormalizer import TransposeOrderNormalizer - return [ExperimentalSparseWeightedSumFrontReplacer, TransposeOrderNormalizer] + return [EmbeddingSegmentsSumFrontReplacer, TransposeOrderNormalizer] def replace_op(self, graph: Graph, node: Node): node_name = node.soft_get('name', node.id) diff --git a/model-optimizer/extensions/front/tf/embedding_segments_sum.py b/model-optimizer/extensions/front/tf/embedding_segments_sum.py index ad96ab714fced4..50b3856745918f 100644 --- a/model-optimizer/extensions/front/tf/embedding_segments_sum.py +++ b/model-optimizer/extensions/front/tf/embedding_segments_sum.py @@ -84,7 +84,8 @@ def replace_sub_graph(self, graph: Graph, match: dict): gather = match['gather'] select = match['select'] output_node_name = select.soft_get('name', select.id) - log.debug('Found EmbeddingSegmentsSum pattern after {} with name {}'.format(sparse_fill_empty_rows.op, sparse_fill_empty_rows.name)) + log.debug('Found EmbeddingSegmentsSum pattern after {} with name {}'.format(sparse_fill_empty_rows.op, + sparse_fill_empty_rows.name)) split_for_indices = create_op_with_const_inputs(graph, Split, {1: int64_array(1)}, {'num_splits': 2}) squeeze_for_indices = create_op_with_const_inputs(graph, Squeeze, {1: int64_array([1])}) @@ -183,7 +184,8 @@ def replace_sub_graph(self, graph: Graph, match: dict): select = match['select'] output_node_name = select.soft_get('name', select.id) - log.debug('Found EmbeddingSegmentsSum2 pattern after {} with name {}'.format(sparse_fill_empty_rows.op, sparse_fill_empty_rows.name)) + log.debug('Found EmbeddingSegmentsSum2 pattern after {} with name {}'.format(sparse_fill_empty_rows.op, + sparse_fill_empty_rows.name)) split_for_indices = create_op_with_const_inputs(graph, Split, {1: int64_array(1)}, {'num_splits': 2, diff --git a/model-optimizer/extensions/middle/EmbeddingBagResolver.py b/model-optimizer/extensions/middle/EmbeddingBagResolver.py new file mode 100644 index 00000000000000..f92c5f60ff96f4 --- /dev/null +++ b/model-optimizer/extensions/middle/EmbeddingBagResolver.py @@ -0,0 +1,69 @@ +""" + Copyright (C) 2018-2020 Intel Corporation + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +""" + +import numpy as np + +from extensions.ops.embedding_bag import EmbeddingBagOffsetsSum, EmbeddingBagPackedSum +from mo.front.common.partial_infer.utils import int64_array +from mo.front.tf.graph_utils import create_op_with_const_inputs +from mo.graph.graph import Graph, rename_node +from mo.middle.replacement import MiddleReplacementPattern +from mo.ops.concat import Concat +from mo.ops.const import Const + + +class EmbeddingBagResolver(MiddleReplacementPattern): + """ + Converts the ATenEmbeddingBag layer to correct internal EmbeddingBag layer. + """ + enabled = True + + def find_and_replace_pattern(self, graph: Graph): + for node in graph.get_op_nodes(op='ATenEmbeddingBag'): + assert node.soft_get('mode') == 0, 'ATen::embedding_bag has unsupported mode, only "sum" ' \ + 'mode is supported for node {}.'.format(node.id) + node_name = node.name + rename_node(node, node_name + '/TBR') + is_packed = False + if len(node.in_ports()) < 3 or node.in_port(2).disconnected(): + is_packed = True + embedding_bag = EmbeddingBagPackedSum(graph, {'name': node_name}).create_node() + else: + embedding_bag = EmbeddingBagOffsetsSum(graph, {'name': node_name}).create_node() + node.in_port(2).get_connection().set_destination(embedding_bag.in_port(2)) + rename_node(embedding_bag, node_name) + node.in_port(0).get_connection().set_destination(embedding_bag.in_port(0)) + node.in_port(1).get_connection().set_destination(embedding_bag.in_port(1)) + node.out_port(0).get_connection().set_source(embedding_bag.out_port(0)) + if len(node.in_ports()) == 4 and not node.in_port(3).disconnected(): + if is_packed: + node.in_port(3).get_connection().set_destination(embedding_bag.in_port(2)) + else: + # connect per_sample_weights + node.in_port(3).get_connection().set_destination(embedding_bag.in_port(4)) + + weights_shape = embedding_bag.in_port(0).data.get_shape() + + # expand embedding table with zeros + default_embeddings = np.zeros([1, weights_shape[-1]]) + weights_concat = create_op_with_const_inputs(graph, Concat, {1: default_embeddings}, + {'axis': 0, 'in_ports_count': 2}) + embedding_bag.in_port(0).get_connection().set_destination(weights_concat.in_port(0)) + weights_concat.out_port(0).connect(embedding_bag.in_port(0)) + + # point default index to expanded part of embedding table + default_index = Const(graph, {'value': int64_array(weights_shape[0])}).create_node() + default_index.out_port(0).connect(embedding_bag.in_port(3)) diff --git a/model-optimizer/extensions/middle/EmbeddingBagResolver_test.py b/model-optimizer/extensions/middle/EmbeddingBagResolver_test.py new file mode 100644 index 00000000000000..d964da69ccd1e0 --- /dev/null +++ b/model-optimizer/extensions/middle/EmbeddingBagResolver_test.py @@ -0,0 +1,133 @@ +""" + Copyright (C) 2020 Intel Corporation + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +""" + +import unittest + +import numpy as np + +from extensions.middle.EmbeddingBagResolver import EmbeddingBagResolver +from mo.front.common.partial_infer.utils import int64_array +from mo.utils.ir_engine.compare_graphs import compare_graphs +from mo.utils.unittest.graph import build_graph, regular_op_with_shaped_data, valued_const_with_data, result, \ + connect + + +class AtenToEmbeddingBagTest(unittest.TestCase): + def test(self): + nodes = { + **valued_const_with_data('weights_inp', np.random.randn(100, 2)), + **regular_op_with_shaped_data('indices_inp', [20], {'type': 'Parameter'}), + **regular_op_with_shaped_data('offsets_inp', [10], {'type': 'Parameter'}), + **regular_op_with_shaped_data('aten', [10, 2], + {'type': None, 'kind': 'op', 'op': 'ATenEmbeddingBag', 'mode': 0, + 'name': 'my_aten'}), + + **regular_op_with_shaped_data('emb_bag', [10, 2], {'type': 'EmbeddingBagOffsetsSum', 'kind': 'op', + 'op': 'EmbeddingBagOffsetsSum'}), + **result('result'), + } + edges = [*connect('weights_inp', '0:aten'), + *connect('indices_inp', '1:aten'), + *connect('offsets_inp', '2:aten'), + *connect('aten', 'result'), + ] + graph = build_graph(nodes, edges) + + edges_ref = [*connect('weights_inp', '0:emb_bag'), + *connect('indices_inp', '1:emb_bag'), + *connect('offsets_inp', '2:emb_bag'), + *connect('emb_bag', 'result'), + ] + + graph_ref = build_graph(nodes, edges_ref) + + EmbeddingBagResolver().find_and_replace_pattern(graph) + + (flag, resp) = compare_graphs(graph, graph_ref, 'result') + self.assertTrue(flag, resp) + + def test_packed(self): + nodes = { + **valued_const_with_data('weights_inp', np.random.randn(100, 4)), + **regular_op_with_shaped_data('indices_inp', [10, 2], {'type': 'Parameter'}), + **regular_op_with_shaped_data('aten', [10, 4], + {'type': None, 'kind': 'op', 'op': 'ATenEmbeddingBag', 'mode': 0, + 'name': 'my_aten'}), + + **regular_op_with_shaped_data('emb_bag', [10, 4], {'type': 'EmbeddingBagPackedSum', 'kind': 'op', + 'op': 'EmbeddingBagPackedSum'}), + **result('result'), + } + edges = [*connect('weights_inp', '0:aten'), + *connect('indices_inp', '1:aten'), + *connect('aten', 'result'), + ] + graph = build_graph(nodes, edges) + + edges_ref = [*connect('weights_inp', '0:emb_bag'), + *connect('indices_inp', '1:emb_bag'), + *connect('emb_bag', 'result'), + ] + + graph_ref = build_graph(nodes, edges_ref) + + EmbeddingBagResolver().find_and_replace_pattern(graph) + + (flag, resp) = compare_graphs(graph, graph_ref, 'result') + self.assertTrue(flag, resp) + + def test_per_sample_weights(self): + nodes = { + **valued_const_with_data('weights_inp', np.random.randn(100, 2)), + **regular_op_with_shaped_data('indices_inp', [20], {'type': 'Parameter'}), + **regular_op_with_shaped_data('offsets_inp', [10], {'type': 'Parameter'}), + **regular_op_with_shaped_data('per_sample_weights', [20], {'type': 'Parameter'}), + **regular_op_with_shaped_data('aten', [10, 2], + {'type': None, 'kind': 'op', 'op': 'ATenEmbeddingBag', 'mode': 0, + 'name': 'my_aten'}), + + **regular_op_with_shaped_data('emb_bag', [10, 2], {'type': 'EmbeddingBagOffsetsSum', 'kind': 'op', + 'op': 'EmbeddingBagOffsetsSum'}), + **valued_const_with_data('zeros', np.zeros([1, 2])), + **regular_op_with_shaped_data('concat', None, {'type': 'Concat', 'kind': 'op', 'op': 'Concat'}), + 'def_index': {'kind': 'op', 'value': int64_array(100), 'shape': None, 'type': 'Const'}, + 'def_index_d': {'kind': 'data', 'value': None, 'shape': None}, + **result('result'), + } + edges = [*connect('weights_inp', '0:aten'), + *connect('indices_inp', '1:aten'), + *connect('offsets_inp', '2:aten'), + *connect('per_sample_weights', '3:aten'), + *connect('aten', 'result'), + ] + graph = build_graph(nodes, edges) + + edges_ref = [*connect('weights_inp', '0:concat'), + *connect('zeros', '1:concat'), + *connect('concat', '0:emb_bag'), + *connect('indices_inp', '1:emb_bag'), + *connect('offsets_inp', '2:emb_bag'), + *connect('def_index', '3:emb_bag'), + *connect('per_sample_weights', '4:emb_bag'), + *connect('emb_bag', 'result'), + ] + + graph_ref = build_graph(nodes, edges_ref) + + EmbeddingBagResolver().find_and_replace_pattern(graph) + + (flag, resp) = compare_graphs(graph, graph_ref, 'result') + self.assertTrue(flag, resp) diff --git a/model-optimizer/extensions/middle/sparse_reshape.py b/model-optimizer/extensions/middle/sparse_reshape.py index f4670e3992c6a1..3282049fd1292f 100644 --- a/model-optimizer/extensions/middle/sparse_reshape.py +++ b/model-optimizer/extensions/middle/sparse_reshape.py @@ -74,8 +74,8 @@ def replace_pattern(self, graph: Graph, match: dict): graph.remove_nodes_from([sparse_reshape.id, input_data_node1.id, input_data_node2.id]) # TODO: investigate why this second way does not work - #sparse_reshape.out_port(0).get_connection().set_source(sparse_reshape.in_port(0).get_source()) - #sparse_reshape.out_port(1).get_connection().set_source(sparse_reshape.in_port(1).get_source()) - #sparse_reshape.in_port(0).get_connection().set_destination(sparse_reshape.in_port(0) - #sparse_reshape.in_port(2).disconnect() - #graph.remove_nodes_from([sparse_reshape.id]) + # sparse_reshape.out_port(0).get_connection().set_source(sparse_reshape.in_port(0).get_source()) + # sparse_reshape.out_port(1).get_connection().set_source(sparse_reshape.in_port(1).get_source()) + # sparse_reshape.in_port(0).get_connection().set_destination(sparse_reshape.in_port(0) + # sparse_reshape.in_port(2).disconnect() + # graph.remove_nodes_from([sparse_reshape.id]) diff --git a/model-optimizer/extensions/ops/embedding_bag.py b/model-optimizer/extensions/ops/embedding_bag.py index 1a33feb5b0d401..fc13dde08ae060 100644 --- a/model-optimizer/extensions/ops/embedding_bag.py +++ b/model-optimizer/extensions/ops/embedding_bag.py @@ -14,11 +14,11 @@ limitations under the License. """ +import numpy as np + from mo.graph.graph import Node, Graph from mo.ops.op import Op -import numpy as np - class EmbeddingBagBase(Op): enabled = False @@ -115,3 +115,23 @@ def infer(node: Node): "doesn't for node: `{}`.".format(name) output_shape = np.concatenate(([num_segments], weights_shape[1:])).astype(np.int64) node.out_port(0).data.set_shape(output_shape) + + +class ATenEmbeddingBag(EmbeddingBagBase): + op = 'ATenEmbeddingBag' + op_type = None + version = None + in_ports_count = 4 + + @staticmethod + def infer(node: Node): + weights_shape = node.in_port(0).data.get_shape() + assert len(weights_shape) >= 2 + indices_shape = node.in_port(1).data.get_shape() + assert indices_shape is not None + if len(indices_shape) == 2: + node.out_port(0).data.set_shape(np.concatenate((indices_shape[:1], weights_shape[1:])).astype(np.int64)) + elif len(indices_shape) == 1: + offsets_shape = node.in_port(2).data.get_shape() + assert offsets_shape is not None and len(offsets_shape) == 1 + node.out_port(0).data.set_shape(np.concatenate((offsets_shape[:1], weights_shape[1:])).astype(np.int64)) From c6ceb77a1e0ebf86c8f4f19f3289fa75efa402ee Mon Sep 17 00:00:00 2001 From: "Maxim, Vafin" Date: Tue, 26 May 2020 11:59:54 +0300 Subject: [PATCH 16/31] Fix BOM --- model-optimizer/automation/package_BOM.txt | 2 +- .../extensions/middle/ATenToEmbeddingBag.py | 69 --------- .../middle/ATenToEmbeddingBag_test.py | 146 ------------------ 3 files changed, 1 insertion(+), 216 deletions(-) delete mode 100644 model-optimizer/extensions/middle/ATenToEmbeddingBag.py delete mode 100644 model-optimizer/extensions/middle/ATenToEmbeddingBag_test.py diff --git a/model-optimizer/automation/package_BOM.txt b/model-optimizer/automation/package_BOM.txt index 523bae4bcd3b86..e51152bb6ccb5c 100644 --- a/model-optimizer/automation/package_BOM.txt +++ b/model-optimizer/automation/package_BOM.txt @@ -492,7 +492,6 @@ extensions/middle/AnchorToPriorBox.py extensions/middle/ApplyNHWCtoNCHWpermutation.py extensions/middle/ApplyPermutations.py extensions/middle/ArgMaxToTopK.py -extensions/middle/ATenToEmbeddingBag.py extensions/middle/AttributedTileNormalizer.py extensions/middle/BiasAddBroadcasting.py extensions/middle/BinarizeWeightsM1P1.py @@ -516,6 +515,7 @@ extensions/middle/DilatedConvolution.py extensions/middle/EltwiseChecker.py extensions/middle/EltwiseInputNormalization.py extensions/middle/EltwiseInputReshape.py +extensions/middle/EmbeddingBagResolver.py extensions/middle/FakeSplitOutputs.py extensions/middle/FusedBatchNormNonConstant.py extensions/middle/FusedBatchNormTraining.py diff --git a/model-optimizer/extensions/middle/ATenToEmbeddingBag.py b/model-optimizer/extensions/middle/ATenToEmbeddingBag.py deleted file mode 100644 index a5ec75479090b1..00000000000000 --- a/model-optimizer/extensions/middle/ATenToEmbeddingBag.py +++ /dev/null @@ -1,69 +0,0 @@ -""" - Copyright (C) 2018-2020 Intel Corporation - - Licensed under the Apache License, Version 2.0 (the "License"); - you may not use this file except in compliance with the License. - You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - - Unless required by applicable law or agreed to in writing, software - distributed under the License is distributed on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - See the License for the specific language governing permissions and - limitations under the License. -""" - -import numpy as np - -from extensions.ops.embedding_bag import EmbeddingBagOffsetsSum, EmbeddingBagPackedSum -from mo.front.common.partial_infer.utils import int64_array -from mo.front.tf.graph_utils import create_op_with_const_inputs -from mo.graph.graph import Graph, rename_node -from mo.middle.replacement import MiddleReplacementPattern -from mo.ops.concat import Concat -from mo.ops.const import Const - - -class AtenToEmbeddingBag(MiddleReplacementPattern): - """ - Converts the ATen layer to EmbeddingBag layer. - """ - enabled = True - - def find_and_replace_pattern(self, graph: Graph): - for node in graph.get_op_nodes(op='ATen', operator='embedding_bag'): - assert node.soft_get('mode') == 0, 'ATen::embedding_bag has unsupported mode, only "sum" ' \ - 'mode is supported for node {}.'.format(node.id) - node_name = node.name - rename_node(node, node_name + '/TBR') - is_packed = False - if len(node.in_ports()) < 3 or node.in_port(2).disconnected(): - is_packed = True - embedding_bag = EmbeddingBagPackedSum(graph, {'name': node_name}).create_node() - else: - embedding_bag = EmbeddingBagOffsetsSum(graph, {'name': node_name}).create_node() - node.in_port(2).get_connection().set_destination(embedding_bag.in_port(2)) - rename_node(embedding_bag, node_name) - node.in_port(0).get_connection().set_destination(embedding_bag.in_port(0)) - node.in_port(1).get_connection().set_destination(embedding_bag.in_port(1)) - node.out_port(0).get_connection().set_source(embedding_bag.out_port(0)) - if len(node.in_ports()) == 4 and not node.in_port(3).disconnected(): - if is_packed: - node.in_port(3).get_connection().set_destination(embedding_bag.in_port(2)) - else: - # connect per_sample_weights - node.in_port(3).get_connection().set_destination(embedding_bag.in_port(4)) - - weights_shape = embedding_bag.in_port(0).data.get_shape() - - # expand embedding table with zeros - default_embeddings = np.zeros([1, weights_shape[-1]]) - weights_concat = create_op_with_const_inputs(graph, Concat, {1: default_embeddings}, - {'axis': 0, 'in_ports_count': 2}) - embedding_bag.in_port(0).get_connection().set_destination(weights_concat.in_port(0)) - weights_concat.out_port(0).connect(embedding_bag.in_port(0)) - - # point default index to expanded part of embedding table - default_index = Const(graph, {'value': int64_array(weights_shape[0])}).create_node() - default_index.out_port(0).connect(embedding_bag.in_port(3)) diff --git a/model-optimizer/extensions/middle/ATenToEmbeddingBag_test.py b/model-optimizer/extensions/middle/ATenToEmbeddingBag_test.py deleted file mode 100644 index e7e2cab6485906..00000000000000 --- a/model-optimizer/extensions/middle/ATenToEmbeddingBag_test.py +++ /dev/null @@ -1,146 +0,0 @@ -""" - Copyright (C) 2020 Intel Corporation - - Licensed under the Apache License, Version 2.0 (the "License"); - you may not use this file except in compliance with the License. - You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - - Unless required by applicable law or agreed to in writing, software - distributed under the License is distributed on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - See the License for the specific language governing permissions and - limitations under the License. -""" - -import unittest - -import numpy as np - -from extensions.middle.ATenToEmbeddingBag import AtenToEmbeddingBag -from mo.front.common.partial_infer.utils import int64_array -from mo.utils.ir_engine.compare_graphs import compare_graphs -from mo.utils.unittest.graph import build_graph, const, regular_op_with_shaped_data, valued_const_with_data, result, \ - connect - -nodes_attributes = { - **const('weights_inp', np.random.randn(1000, 10)), - 'indices_inp': {'shape': None, 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, - 'offsets_inp': {'shape': None, 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, - **const('per_sample_weights', np.random.randn(20)), - 'aten': {'type': None, 'kind': 'op', 'op': 'ATen', 'mode': 0, 'operator': 'embedding_bag', 'name': 'my_aten'}, - 'result': {'type': 'Result', 'value': None, 'kind': 'op', 'op': 'Result'}, - - # new EmbeddingBag layer - 'emb_bag': {'type': 'EmbeddingBagOffsetsSum', 'kind': 'op', 'op': 'EmbeddingBagOffsetsSum'}, -} - - -class AtenToEmbeddingBagTest(unittest.TestCase): - def test(self): - nodes = { - **valued_const_with_data('weights_inp', np.random.randn(100, 2)), - **regular_op_with_shaped_data('indices_inp', [20], {'type': 'Parameter'}), - **regular_op_with_shaped_data('offsets_inp', [10], {'type': 'Parameter'}), - **regular_op_with_shaped_data('aten', [10, 2], - {'type': None, 'kind': 'op', 'op': 'ATen', 'mode': 0, - 'operator': 'embedding_bag', 'name': 'my_aten'}), - - **regular_op_with_shaped_data('emb_bag', [10, 2], {'type': 'EmbeddingBagOffsetsSum', 'kind': 'op', - 'op': 'EmbeddingBagOffsetsSum'}), - **result('result'), - } - edges = [*connect('weights_inp', '0:aten'), - *connect('indices_inp', '1:aten'), - *connect('offsets_inp', '2:aten'), - *connect('aten', 'result'), - ] - graph = build_graph(nodes, edges) - - edges_ref = [*connect('weights_inp', '0:emb_bag'), - *connect('indices_inp', '1:emb_bag'), - *connect('offsets_inp', '2:emb_bag'), - *connect('emb_bag', 'result'), - ] - - graph_ref = build_graph(nodes, edges_ref) - - AtenToEmbeddingBag().find_and_replace_pattern(graph) - - (flag, resp) = compare_graphs(graph, graph_ref, 'result') - self.assertTrue(flag, resp) - - - def test_packed(self): - nodes = { - **valued_const_with_data('weights_inp', np.random.randn(100, 4)), - **regular_op_with_shaped_data('indices_inp', [10, 2], {'type': 'Parameter'}), - **regular_op_with_shaped_data('aten', [10, 4], - {'type': None, 'kind': 'op', 'op': 'ATen', 'mode': 0, - 'operator': 'embedding_bag', 'name': 'my_aten'}), - - **regular_op_with_shaped_data('emb_bag', [10, 4], {'type': 'EmbeddingBagPackedSum', 'kind': 'op', - 'op': 'EmbeddingBagPackedSum'}), - **result('result'), - } - edges = [*connect('weights_inp', '0:aten'), - *connect('indices_inp', '1:aten'), - *connect('aten', 'result'), - ] - graph = build_graph(nodes, edges) - - edges_ref = [*connect('weights_inp', '0:emb_bag'), - *connect('indices_inp', '1:emb_bag'), - *connect('emb_bag', 'result'), - ] - - graph_ref = build_graph(nodes, edges_ref) - - AtenToEmbeddingBag().find_and_replace_pattern(graph) - - (flag, resp) = compare_graphs(graph, graph_ref, 'result') - self.assertTrue(flag, resp) - - def test_per_sample_weights(self): - nodes = { - **valued_const_with_data('weights_inp', np.random.randn(100, 2)), - **regular_op_with_shaped_data('indices_inp', [20], {'type': 'Parameter'}), - **regular_op_with_shaped_data('offsets_inp', [10], {'type': 'Parameter'}), - **regular_op_with_shaped_data('per_sample_weights', [20], {'type': 'Parameter'}), - **regular_op_with_shaped_data('aten', [10, 2], - {'type': None, 'kind': 'op', 'op': 'ATen', 'mode': 0, - 'operator': 'embedding_bag', 'name': 'my_aten'}), - - **regular_op_with_shaped_data('emb_bag', [10, 2], {'type': 'EmbeddingBagOffsetsSum', 'kind': 'op', - 'op': 'EmbeddingBagOffsetsSum'}), - **valued_const_with_data('zeros', np.zeros([1, 2])), - **regular_op_with_shaped_data('concat', None, {'type': 'Concat', 'kind': 'op', 'op': 'Concat'}), - 'def_index': {'kind': 'op', 'value': int64_array(100), 'shape': None, 'type': 'Const'}, - 'def_index_d': {'kind': 'data', 'value': None, 'shape': None}, - **result('result'), - } - edges = [*connect('weights_inp', '0:aten'), - *connect('indices_inp', '1:aten'), - *connect('offsets_inp', '2:aten'), - *connect('per_sample_weights', '3:aten'), - *connect('aten', 'result'), - ] - graph = build_graph(nodes, edges) - - edges_ref = [*connect('weights_inp', '0:concat'), - *connect('zeros', '1:concat'), - *connect('concat', '0:emb_bag'), - *connect('indices_inp', '1:emb_bag'), - *connect('offsets_inp', '2:emb_bag'), - *connect('def_index', '3:emb_bag'), - *connect('per_sample_weights', '4:emb_bag'), - *connect('emb_bag', 'result'), - ] - - graph_ref = build_graph(nodes, edges_ref) - - AtenToEmbeddingBag().find_and_replace_pattern(graph) - - (flag, resp) = compare_graphs(graph, graph_ref, 'result') - self.assertTrue(flag, resp) From ab67e0e36618ca11949c5f59c48cd99b5d879428 Mon Sep 17 00:00:00 2001 From: Roman Kazantsev Date: Sun, 31 May 2020 13:36:41 +0500 Subject: [PATCH 17/31] Work around limitation for I64 input of W&D model Signed-off-by: Roman Kazantsev --- .../extensions/front/tf/WhereDecomposition.py | 4 ++-- .../front/tf/embedding_segments_sum.py | 24 +++++++++++++++---- .../front/tf/embedding_segments_sum_test.py | 16 +++++++++---- 3 files changed, 34 insertions(+), 10 deletions(-) diff --git a/model-optimizer/extensions/front/tf/WhereDecomposition.py b/model-optimizer/extensions/front/tf/WhereDecomposition.py index 64c56a85ff2bd4..a8e513be399f5c 100644 --- a/model-optimizer/extensions/front/tf/WhereDecomposition.py +++ b/model-optimizer/extensions/front/tf/WhereDecomposition.py @@ -33,9 +33,9 @@ class WhereDecomposition(FrontReplacementOp): enabled = True def run_after(self): - from extensions.front.tf.embedding_segments_sum import EmbeddingSegmentsSumFrontReplacer + from extensions.front.tf.embedding_segments_sum import EmbeddingSegmentsSumFrontReplacer, EmbeddingSegmentsSumFrontReplacer2 from extensions.front.TransposeOrderNormalizer import TransposeOrderNormalizer - return [EmbeddingSegmentsSumFrontReplacer, TransposeOrderNormalizer] + return [EmbeddingSegmentsSumFrontReplacer, EmbeddingSegmentsSumFrontReplacer2, TransposeOrderNormalizer] def replace_op(self, graph: Graph, node: Node): node_name = node.soft_get('name', node.id) diff --git a/model-optimizer/extensions/front/tf/embedding_segments_sum.py b/model-optimizer/extensions/front/tf/embedding_segments_sum.py index 50b3856745918f..1a9482122a260a 100644 --- a/model-optimizer/extensions/front/tf/embedding_segments_sum.py +++ b/model-optimizer/extensions/front/tf/embedding_segments_sum.py @@ -15,7 +15,9 @@ """ import logging as log +import numpy as np +from extensions.ops.Cast import Cast from extensions.ops.embedding_bag import EmbeddingSegmentsSum from extensions.ops.split import Split from mo.front.common.partial_infer.utils import int64_array @@ -32,6 +34,7 @@ class EmbeddingSegmentsSumFrontReplacer(FrontReplacementSubgraph): Such sub-graph is met in the Wide and Deep model in case of the SINGLE categorical feature. """ enabled = True + force_clean_up = True def pattern(self): log.debug('Enabled EmbeddingSegmentsSum replacement') @@ -91,6 +94,8 @@ def replace_sub_graph(self, graph: Graph, match: dict): squeeze_for_indices = create_op_with_const_inputs(graph, Squeeze, {1: int64_array([1])}) split_for_dense_shape = create_op_with_const_inputs(graph, Split, {1: int64_array(0)}, {'num_splits': 2}) squeeze_to_scalar = create_op_with_const_inputs(graph, Squeeze, {1: int64_array([0])}) + cast_default_value = Cast(graph, {'name': output_node_name + '/CastDefaultValue', 'dst_type': np.int32}).create_node() + cast_num_segments = Cast(graph, {'name': output_node_name + '/CastSegmentsNumber', 'dst_type': np.int32}).create_node() embedding_segments_sum = EmbeddingSegmentsSum(graph, {'name': output_node_name}).create_node() rename_nodes([(select, output_node_name + '/AbandonedName'), (embedding_segments_sum, output_node_name)]) @@ -105,9 +110,13 @@ def replace_sub_graph(self, graph: Graph, match: dict): # split and connect number of segments identity_spw.in_port(0).get_connection().set_destination(split_for_dense_shape.in_port(0)) squeeze_to_scalar.in_port(0).connect(split_for_dense_shape.out_port(0)) - embedding_segments_sum.in_port(3).connect(squeeze_to_scalar.out_port(0)) + # TODO: remove casting once we start to support I64 model input + cast_num_segments.in_port(0).connect(squeeze_to_scalar.out_port(0)) + embedding_segments_sum.in_port(3).connect(cast_num_segments.out_port(0)) # connect default value - sparse_fill_empty_rows.in_port(3).get_connection().set_destination(embedding_segments_sum.in_port(4)) + # TODO: remove casting once we start to support I64 model input + sparse_fill_empty_rows.in_port(3).get_connection().set_destination(cast_default_value.in_port(0)) + embedding_segments_sum.in_port(4).connect(cast_default_value.out_port(0)) # no input port for per_sample_weight identity_spw.in_port(0).disconnect() @@ -128,6 +137,7 @@ class EmbeddingSegmentsSumFrontReplacer2(FrontReplacementSubgraph): Such sub-graph is met in the Wide and Deep model in case of MULTIPLE categorical features. """ enabled = True + force_clean_up = True def pattern(self): log.debug('Enabled EmbeddingSegmentsSum2 replacement') @@ -195,6 +205,8 @@ def replace_sub_graph(self, graph: Graph, match: dict): {'num_splits': 2, 'name': output_node_name + '/SplitForDenseShape'}) squeeze_to_scalar = create_op_with_const_inputs(graph, Squeeze, {1: int64_array([0])}) + cast_default_value = Cast(graph, {'name': output_node_name + '/CastDefaultValue', 'dst_type': np.int32}).create_node() + cast_num_segments = Cast(graph, {'name': output_node_name + '/CastSegmentsNumber', 'dst_type': np.int32}).create_node() embedding_segments_sum = EmbeddingSegmentsSum(graph, {'name': output_node_name}).create_node() rename_nodes([(select, output_node_name + '/AbandonedName'), (embedding_segments_sum, output_node_name)]) @@ -209,9 +221,13 @@ def replace_sub_graph(self, graph: Graph, match: dict): # split and connect number of segments identity_spw.in_port(0).get_connection().set_destination(split_for_dense_shape.in_port(0)) squeeze_to_scalar.in_port(0).connect(split_for_dense_shape.out_port(0)) - embedding_segments_sum.in_port(3).connect(squeeze_to_scalar.out_port(0)) + # TODO: remove casting once we start to support I64 model input + cast_num_segments.in_port(0).connect(squeeze_to_scalar.out_port(0)) + embedding_segments_sum.in_port(3).connect(cast_num_segments.out_port(0)) # connect default value - sparse_fill_empty_rows.in_port(3).get_connection().set_destination(embedding_segments_sum.in_port(4)) + # TODO: remove casting once we start to support I64 model input + sparse_fill_empty_rows.in_port(3).get_connection().set_destination(cast_default_value.in_port(0)) + embedding_segments_sum.in_port(4).connect(cast_default_value.out_port(0)) # no input port for per_sample_weight identity_spw.in_port(0).disconnect() diff --git a/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py b/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py index d4944489b73d16..0b28dead6315ce 100644 --- a/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py +++ b/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py @@ -51,6 +51,8 @@ def test1(self): 'squeeze_for_indices': {'kind': 'op', 'op': 'Squeeze'}, 'split_for_dense_shape': {'kind': 'op', 'op': 'Split'}, 'squeeze_to_scalar': {'kind': 'op', 'op': 'Squeeze'}, + 'cast_default_value': {'kind': 'op', 'op': 'Cast'}, + 'cast_number_segments': {'kind': 'op', 'op': 'Cast'}, 'embedding_segments_sum': {'kind': 'op', 'op': 'EmbeddingSegmentsSum'}, **const('split_for_indices_axis', int64_array(1)), @@ -103,9 +105,11 @@ def test1(self): ('split_for_dense_shape_axis', 'split_for_dense_shape', {'in': 1}), ('split_for_dense_shape', 'squeeze_to_scalar', {'in': 0}), ('squeeze_axis', 'squeeze_to_scalar', {'in': 1}), - ('squeeze_to_scalar', 'embedding_segments_sum', {'in': 3, 'out': 0}), + ('squeeze_to_scalar', 'cast_number_segments', {'in': 0}), + ('cast_number_segments', 'embedding_segments_sum', {'in': 3, 'out': 0}), ('input_params_table', 'embedding_segments_sum', {'in': 0}), - ('input_default_value', 'embedding_segments_sum', {'in': 4}), + ('input_default_value', 'cast_default_value', {'in': 0}), + ('cast_default_value', 'embedding_segments_sum', {'in': 4}), ('embedding_segments_sum', 'last', {'in': 0}),], nodes_with_edges_only=True) @@ -142,6 +146,8 @@ def test2(self): 'squeeze_for_indices': {'kind': 'op', 'op': 'Squeeze'}, 'split_for_dense_shape': {'kind': 'op', 'op': 'Split'}, 'squeeze_to_scalar': {'kind': 'op', 'op': 'Squeeze'}, + 'cast_default_value': {'kind': 'op', 'op': 'Cast'}, + 'cast_number_segments': {'kind': 'op', 'op': 'Cast'}, 'embedding_segments_sum': {'kind': 'op', 'op': 'EmbeddingSegmentsSum'}, **const('split_for_indices_axis', int64_array(1)), @@ -196,9 +202,11 @@ def test2(self): ('split_for_dense_shape_axis', 'split_for_dense_shape', {'in': 1}), ('split_for_dense_shape', 'squeeze_to_scalar', {'in': 0}), ('squeeze_axis', 'squeeze_to_scalar', {'in': 1}), - ('squeeze_to_scalar', 'embedding_segments_sum', {'in': 3, 'out': 0}), + ('squeeze_to_scalar', 'cast_number_segments', {'in': 0}), + ('cast_number_segments', 'embedding_segments_sum', {'in': 3, 'out': 0}), ('input_params_table', 'embedding_segments_sum', {'in': 0}), - ('input_default_value', 'embedding_segments_sum', {'in': 4}), + ('input_default_value', 'cast_default_value', {'in': 0}), + ('cast_default_value', 'embedding_segments_sum', {'in': 4}), ('embedding_segments_sum', 'last', {'in': 0}),], nodes_with_edges_only=True) From 3b9ae651e6cbbb1e1523707f295ae518450568c2 Mon Sep 17 00:00:00 2001 From: Roman Kazantsev Date: Mon, 1 Jun 2020 12:00:57 +0500 Subject: [PATCH 18/31] Cleanup where operation to fix affect of WhereDecomposition transform Signed-off-by: Roman Kazantsev --- .../extensions/front/tf/embedding_segments_sum.py | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/model-optimizer/extensions/front/tf/embedding_segments_sum.py b/model-optimizer/extensions/front/tf/embedding_segments_sum.py index 1a9482122a260a..eee59e119ed12f 100644 --- a/model-optimizer/extensions/front/tf/embedding_segments_sum.py +++ b/model-optimizer/extensions/front/tf/embedding_segments_sum.py @@ -34,7 +34,6 @@ class EmbeddingSegmentsSumFrontReplacer(FrontReplacementSubgraph): Such sub-graph is met in the Wide and Deep model in case of the SINGLE categorical feature. """ enabled = True - force_clean_up = True def pattern(self): log.debug('Enabled EmbeddingSegmentsSum replacement') @@ -83,10 +82,11 @@ def replace_sub_graph(self, graph: Graph, match: dict): gather0_2 = match['gather0_2'] greaterequal0 = match['greaterequal0'] sparse_fill_empty_rows = match['sparse_fill_empty_rows'] - gather = match['gather'] select = match['select'] + where0 = match['where0'] output_node_name = select.soft_get('name', select.id) + log.debug('Found EmbeddingSegmentsSum pattern after {} with name {}'.format(sparse_fill_empty_rows.op, sparse_fill_empty_rows.name)) @@ -127,7 +127,7 @@ def replace_sub_graph(self, graph: Graph, match: dict): gather.in_port(0).disconnect() select.out_port(0).get_connection().set_source(embedding_segments_sum.out_port(0)) - graph.remove_nodes_from([gather0_1.id, gather0_2.id, greaterequal0.id, sparse_fill_empty_rows.id, select.id]) + graph.remove_nodes_from([gather0_1.id, gather0_2.id, greaterequal0.id, sparse_fill_empty_rows.id, select.id, where0.id]) class EmbeddingSegmentsSumFrontReplacer2(FrontReplacementSubgraph): @@ -137,7 +137,6 @@ class EmbeddingSegmentsSumFrontReplacer2(FrontReplacementSubgraph): Such sub-graph is met in the Wide and Deep model in case of MULTIPLE categorical features. """ enabled = True - force_clean_up = True def pattern(self): log.debug('Enabled EmbeddingSegmentsSum2 replacement') @@ -192,6 +191,7 @@ def replace_sub_graph(self, graph: Graph, match: dict): sparse_fill_empty_rows = match['sparse_fill_empty_rows'] gather = match['gather'] select = match['select'] + where0 = match['where0'] output_node_name = select.soft_get('name', select.id) log.debug('Found EmbeddingSegmentsSum2 pattern after {} with name {}'.format(sparse_fill_empty_rows.op, @@ -238,4 +238,4 @@ def replace_sub_graph(self, graph: Graph, match: dict): gather.in_port(0).disconnect() select.out_port(0).get_connection().set_source(embedding_segments_sum.out_port(0)) - graph.remove_nodes_from([gather0_1.id, gather0_2.id, greaterequal0.id, sparse_fill_empty_rows.id, select.id]) + graph.remove_nodes_from([gather0_1.id, gather0_2.id, greaterequal0.id, sparse_fill_empty_rows.id, select.id, where0.id]) From 80960f93cbadbdf3a36573b14c52e7d7254c46d9 Mon Sep 17 00:00:00 2001 From: "Maxim, Vafin" Date: Mon, 1 Jun 2020 16:42:58 +0300 Subject: [PATCH 19/31] Fix BOM --- model-optimizer/automation/package_BOM.txt | 1 + 1 file changed, 1 insertion(+) diff --git a/model-optimizer/automation/package_BOM.txt b/model-optimizer/automation/package_BOM.txt index e51152bb6ccb5c..a2f5b486314398 100644 --- a/model-optimizer/automation/package_BOM.txt +++ b/model-optimizer/automation/package_BOM.txt @@ -73,6 +73,7 @@ extensions/back/TransposeToPermute.py extensions/back/UselessConcatRemoval.py extensions/front/__init__.py extensions/front/ArgMaxSqueeze.py +extensions/front/ATenToEmbeddingBag.py extensions/front/AttributedClampNormalizer.py extensions/front/AttributedGatherNormalizer.py extensions/front/AttributedPadToPad.py From 2d6de5dad2ab4f7dec9445d75eadc735b80c0d2c Mon Sep 17 00:00:00 2001 From: Roman Kazantsev Date: Wed, 3 Jun 2020 18:43:47 +0500 Subject: [PATCH 20/31] Correct EmbeddingSegmentSum transform for Wide and Deep Add casting segment ids to i32 and remove ConstToResult sub-graph. Signed-off-by: Roman Kazantsev --- .../extensions/back/RemoveConstToResult.py | 47 ++++++++ .../front/tf/embedding_segments_sum.py | 10 +- .../front/tf/embedding_segments_sum_test.py | 108 +++++++++--------- 3 files changed, 111 insertions(+), 54 deletions(-) create mode 100644 model-optimizer/extensions/back/RemoveConstToResult.py diff --git a/model-optimizer/extensions/back/RemoveConstToResult.py b/model-optimizer/extensions/back/RemoveConstToResult.py new file mode 100644 index 00000000000000..84324b439af403 --- /dev/null +++ b/model-optimizer/extensions/back/RemoveConstToResult.py @@ -0,0 +1,47 @@ +""" + Copyright (C) 2020 Intel Corporation + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +""" +import logging as log + +from mo.back.replacement import BackReplacementPattern +from mo.graph.graph import Graph + + +class RemoveConstToResult(BackReplacementPattern): + """ + Transformation looks for a sub-graph "Const->Result" + and removes Result node. + """ + enabled = True + #force_clean_up = True + + @staticmethod + def pattern(): + return dict( + nodes=[ + ('const_node', {'type': 'Const', 'kind': 'op'}), + ('const_data', {'kind': 'data'}), + ('result_node', {'type': 'Result', 'kind': 'op'}), + ], + edges=[ + ('const_node', 'const_data'), + ('const_data', 'result_node') + ] + ) + + @staticmethod + def replace_pattern(graph: Graph, match: dict): + result_node = match['result_node'] + graph.remove_node(result_node.id) diff --git a/model-optimizer/extensions/front/tf/embedding_segments_sum.py b/model-optimizer/extensions/front/tf/embedding_segments_sum.py index eee59e119ed12f..f15b643654e5f9 100644 --- a/model-optimizer/extensions/front/tf/embedding_segments_sum.py +++ b/model-optimizer/extensions/front/tf/embedding_segments_sum.py @@ -94,6 +94,7 @@ def replace_sub_graph(self, graph: Graph, match: dict): squeeze_for_indices = create_op_with_const_inputs(graph, Squeeze, {1: int64_array([1])}) split_for_dense_shape = create_op_with_const_inputs(graph, Split, {1: int64_array(0)}, {'num_splits': 2}) squeeze_to_scalar = create_op_with_const_inputs(graph, Squeeze, {1: int64_array([0])}) + cast_segment_ids = Cast(graph, {'name': output_node_name + '/CastSegmentIds', 'dst_type': np.int32}).create_node() cast_default_value = Cast(graph, {'name': output_node_name + '/CastDefaultValue', 'dst_type': np.int32}).create_node() cast_num_segments = Cast(graph, {'name': output_node_name + '/CastSegmentsNumber', 'dst_type': np.int32}).create_node() embedding_segments_sum = EmbeddingSegmentsSum(graph, {'name': output_node_name}).create_node() @@ -106,7 +107,9 @@ def replace_sub_graph(self, graph: Graph, match: dict): # split and connect segment ids gather0_1.in_port(0).get_connection().set_destination(split_for_indices.in_port(0)) squeeze_for_indices.in_port(0).connect(split_for_indices.out_port(0)) - embedding_segments_sum.in_port(2).connect(squeeze_for_indices.out_port(0)) + # TODO: remove casting once we start to support I64 model input + cast_segment_ids.in_port(0).connect(squeeze_for_indices.out_port(0)) + embedding_segments_sum.in_port(2).connect(cast_segment_ids.out_port(0)) # split and connect number of segments identity_spw.in_port(0).get_connection().set_destination(split_for_dense_shape.in_port(0)) squeeze_to_scalar.in_port(0).connect(split_for_dense_shape.out_port(0)) @@ -205,6 +208,7 @@ def replace_sub_graph(self, graph: Graph, match: dict): {'num_splits': 2, 'name': output_node_name + '/SplitForDenseShape'}) squeeze_to_scalar = create_op_with_const_inputs(graph, Squeeze, {1: int64_array([0])}) + cast_segment_ids = Cast(graph, {'name': output_node_name + '/CastSegmentIds', 'dst_type': np.int32}).create_node() cast_default_value = Cast(graph, {'name': output_node_name + '/CastDefaultValue', 'dst_type': np.int32}).create_node() cast_num_segments = Cast(graph, {'name': output_node_name + '/CastSegmentsNumber', 'dst_type': np.int32}).create_node() embedding_segments_sum = EmbeddingSegmentsSum(graph, {'name': output_node_name}).create_node() @@ -217,7 +221,9 @@ def replace_sub_graph(self, graph: Graph, match: dict): # split and connect segment ids gather0_1.in_port(0).get_connection().set_destination(split_for_indices.in_port(0)) squeeze_for_indices.in_port(0).connect(split_for_indices.out_port(0)) - embedding_segments_sum.in_port(2).connect(squeeze_for_indices.out_port(0)) + # TODO: remove casting once we start to support I64 model input + cast_segment_ids.in_port(0).connect(squeeze_for_indices.out_port(0)) + embedding_segments_sum.in_port(2).connect(cast_segment_ids.out_port(0)) # split and connect number of segments identity_spw.in_port(0).get_connection().set_destination(split_for_dense_shape.in_port(0)) squeeze_to_scalar.in_port(0).connect(split_for_dense_shape.out_port(0)) diff --git a/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py b/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py index 0b28dead6315ce..daed2c76b9e8a0 100644 --- a/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py +++ b/model-optimizer/extensions/front/tf/embedding_segments_sum_test.py @@ -51,6 +51,7 @@ def test1(self): 'squeeze_for_indices': {'kind': 'op', 'op': 'Squeeze'}, 'split_for_dense_shape': {'kind': 'op', 'op': 'Split'}, 'squeeze_to_scalar': {'kind': 'op', 'op': 'Squeeze'}, + 'cast_segment_ids': {'kind': 'op', 'op': 'Cast'}, 'cast_default_value': {'kind': 'op', 'op': 'Cast'}, 'cast_number_segments': {'kind': 'op', 'op': 'Cast'}, 'embedding_segments_sum': {'kind': 'op', 'op': 'EmbeddingSegmentsSum'}, @@ -65,31 +66,31 @@ def test1(self): graph = build_graph(nodes_attributes, [('input_indices', 'gather0_1', {'out': 0, 'in': 0}), - ('input_dense_shape', 'identity_spw', {'out': 0, 'in': 0}), - ('input_values', 'greaterequal0', {'out': 0, 'in': 0}), - ('input_values', 'gather0_2', {'out': 0, 'in': 0}), - ('input_params_table', 'gather', {'out': 0, 'in': 0}), - ('input_default_value', 'sparse_fill_empty_rows', {'out': 0, 'in': 3}), + ('input_dense_shape', 'identity_spw', {'out': 0, 'in': 0}), + ('input_values', 'greaterequal0', {'out': 0, 'in': 0}), + ('input_values', 'gather0_2', {'out': 0, 'in': 0}), + ('input_params_table', 'gather', {'out': 0, 'in': 0}), + ('input_default_value', 'sparse_fill_empty_rows', {'out': 0, 'in': 3}), - ('gather0_1', 'sparse_fill_empty_rows', {'out': 0, 'in': 0}), - ('gather0_2', 'sparse_fill_empty_rows', {'out': 0, 'in': 1}), - ('identity_spw', 'sparse_fill_empty_rows', {'out': 0, 'in': 2}), - ('reshape0', 'gather0_1', {'out': 0, 'in': 1}), - ('reshape0', 'gather0_2', {'out': 0, 'in': 1}), - ('where0', 'reshape0', {'out': 0, 'in': 0}), - ('greaterequal0', 'where0', {'out': 0, 'in': 0}), - ('sparse_fill_empty_rows', 'unique', {'out': 1, 'in': 0}), - ('sparse_fill_empty_rows', 'strided_slice', {'out': 0, 'in': 0}), - ('sparse_fill_empty_rows', 'reshape', {'out': 2, 'in': 0}), - ('unique', 'sparse_segment_sum', {'out': 1, 'in': 1}), - ('unique', 'gather', {'out': 0, 'in': 1}), - ('strided_slice', 'cast', {'out': 0, 'in': 0}), - ('gather', 'sparse_segment_sum', {'out': 0, 'in': 0}), - ('cast', 'sparse_segment_sum', {'out': 0, 'in': 2}), - ('sparse_segment_sum', 'select', {'out': 0, 'in': 2}), - ('reshape', 'tile', {'out': 0, 'in': 0}), - ('tile', 'select', {'out': 0, 'in': 0}), - ('select', 'last', {'out': 0, 'in': 0}), + ('gather0_1', 'sparse_fill_empty_rows', {'out': 0, 'in': 0}), + ('gather0_2', 'sparse_fill_empty_rows', {'out': 0, 'in': 1}), + ('identity_spw', 'sparse_fill_empty_rows', {'out': 0, 'in': 2}), + ('reshape0', 'gather0_1', {'out': 0, 'in': 1}), + ('reshape0', 'gather0_2', {'out': 0, 'in': 1}), + ('where0', 'reshape0', {'out': 0, 'in': 0}), + ('greaterequal0', 'where0', {'out': 0, 'in': 0}), + ('sparse_fill_empty_rows', 'unique', {'out': 1, 'in': 0}), + ('sparse_fill_empty_rows', 'strided_slice', {'out': 0, 'in': 0}), + ('sparse_fill_empty_rows', 'reshape', {'out': 2, 'in': 0}), + ('unique', 'sparse_segment_sum', {'out': 1, 'in': 1}), + ('unique', 'gather', {'out': 0, 'in': 1}), + ('strided_slice', 'cast', {'out': 0, 'in': 0}), + ('gather', 'sparse_segment_sum', {'out': 0, 'in': 0}), + ('cast', 'sparse_segment_sum', {'out': 0, 'in': 2}), + ('sparse_segment_sum', 'select', {'out': 0, 'in': 2}), + ('reshape', 'tile', {'out': 0, 'in': 0}), + ('tile', 'select', {'out': 0, 'in': 0}), + ('select', 'last', {'out': 0, 'in': 0}), ], nodes_with_edges_only=True) graph.stage = 'front' EmbeddingSegmentsSumFrontReplacer().find_and_replace_pattern(graph) @@ -99,7 +100,8 @@ def test1(self): ('split_for_indices_axis', 'split_for_indices', {'in': 1}), ('split_for_indices', 'squeeze_for_indices', {'in': 0}), ('squeeze_for_indices_axis', 'squeeze_for_indices', {'in': 1}), - ('squeeze_for_indices', 'embedding_segments_sum', {'in': 2, 'out': 0}), + ('squeeze_for_indices', 'cast_segment_ids', {'in': 0}), + ('cast_segment_ids', 'embedding_segments_sum', {'in': 2, 'out': 0}), ('input_values', 'embedding_segments_sum', {'in': 1}), ('input_dense_shape', 'split_for_dense_shape', {'in': 0}), ('split_for_dense_shape_axis', 'split_for_dense_shape', {'in': 1}), @@ -146,6 +148,7 @@ def test2(self): 'squeeze_for_indices': {'kind': 'op', 'op': 'Squeeze'}, 'split_for_dense_shape': {'kind': 'op', 'op': 'Split'}, 'squeeze_to_scalar': {'kind': 'op', 'op': 'Squeeze'}, + 'cast_segment_ids': {'kind': 'op', 'op': 'Cast'}, 'cast_default_value': {'kind': 'op', 'op': 'Cast'}, 'cast_number_segments': {'kind': 'op', 'op': 'Cast'}, 'embedding_segments_sum': {'kind': 'op', 'op': 'EmbeddingSegmentsSum'}, @@ -160,33 +163,33 @@ def test2(self): graph = build_graph(nodes_attributes, [('input_indices', 'gather0_1', {'out': 0, 'in': 0}), - ('input_dense_shape', 'identity_spw', {'out': 0, 'in': 0}), - ('input_values', 'greaterequal0', {'out': 0, 'in': 0}), - ('input_values', 'gather0_2', {'out': 0, 'in': 0}), - ('input_params_table', 'gather', {'out': 0, 'in': 0}), - ('input_default_value', 'sparse_fill_empty_rows', {'out': 0, 'in': 3}), + ('input_dense_shape', 'identity_spw', {'out': 0, 'in': 0}), + ('input_values', 'greaterequal0', {'out': 0, 'in': 0}), + ('input_values', 'gather0_2', {'out': 0, 'in': 0}), + ('input_params_table', 'gather', {'out': 0, 'in': 0}), + ('input_default_value', 'sparse_fill_empty_rows', {'out': 0, 'in': 3}), - ('identity_spw', 'sparse_fill_empty_rows', {'out': 0, 'in': 2}), - ('gather0_1', 'sparse_fill_empty_rows', {'out': 0, 'in': 0}), - ('gather0_2', 'sparse_fill_empty_rows', {'out': 0, 'in': 1}), - ('reshape0', 'gather0_1', {'out': 0, 'in': 1}), - ('reshape0', 'gather0_2', {'out': 0, 'in': 1}), - ('where0', 'reshape0', {'out': 0, 'in': 0}), - ('greaterequal0', 'where0', {'out': 0, 'in': 0}), - ('sparse_fill_empty_rows', 'unique', {'out': 1, 'in': 0}), - ('sparse_fill_empty_rows', 'strided_slice', {'out': 0, 'in': 0}), - ('sparse_fill_empty_rows', 'reshape', {'out': 2, 'in': 0}), - ('unique', 'sparse_segment_sum', {'out': 1, 'in': 1}), - ('unique', 'gather', {'out': 0, 'in': 1}), - ('strided_slice', 'cast', {'out': 0, 'in': 0}), - ('gather', 'identity', {'out': 0, 'in': 0}), - ('identity', 'identity_1', {'out': 0, 'in': 0}), - ('identity_1', 'sparse_segment_sum', {'out': 0, 'in': 0}), - ('cast', 'sparse_segment_sum', {'out': 0, 'in': 2}), - ('sparse_segment_sum', 'select', {'out': 0, 'in': 2}), - ('reshape', 'tile', {'out': 0, 'in': 0}), - ('tile', 'select', {'out': 0, 'in': 0}), - ('select', 'last', {'out': 0, 'in': 0})], + ('identity_spw', 'sparse_fill_empty_rows', {'out': 0, 'in': 2}), + ('gather0_1', 'sparse_fill_empty_rows', {'out': 0, 'in': 0}), + ('gather0_2', 'sparse_fill_empty_rows', {'out': 0, 'in': 1}), + ('reshape0', 'gather0_1', {'out': 0, 'in': 1}), + ('reshape0', 'gather0_2', {'out': 0, 'in': 1}), + ('where0', 'reshape0', {'out': 0, 'in': 0}), + ('greaterequal0', 'where0', {'out': 0, 'in': 0}), + ('sparse_fill_empty_rows', 'unique', {'out': 1, 'in': 0}), + ('sparse_fill_empty_rows', 'strided_slice', {'out': 0, 'in': 0}), + ('sparse_fill_empty_rows', 'reshape', {'out': 2, 'in': 0}), + ('unique', 'sparse_segment_sum', {'out': 1, 'in': 1}), + ('unique', 'gather', {'out': 0, 'in': 1}), + ('strided_slice', 'cast', {'out': 0, 'in': 0}), + ('gather', 'identity', {'out': 0, 'in': 0}), + ('identity', 'identity_1', {'out': 0, 'in': 0}), + ('identity_1', 'sparse_segment_sum', {'out': 0, 'in': 0}), + ('cast', 'sparse_segment_sum', {'out': 0, 'in': 2}), + ('sparse_segment_sum', 'select', {'out': 0, 'in': 2}), + ('reshape', 'tile', {'out': 0, 'in': 0}), + ('tile', 'select', {'out': 0, 'in': 0}), + ('select', 'last', {'out': 0, 'in': 0})], nodes_with_edges_only=True) graph.stage = 'front' EmbeddingSegmentsSumFrontReplacer2().find_and_replace_pattern(graph) @@ -196,7 +199,8 @@ def test2(self): ('split_for_indices_axis', 'split_for_indices', {'in': 1}), ('split_for_indices', 'squeeze_for_indices', {'in': 0}), ('squeeze_for_indices_axis', 'squeeze_for_indices', {'in': 1}), - ('squeeze_for_indices', 'embedding_segments_sum', {'in': 2, 'out': 0}), + ('squeeze_for_indices', 'cast_segment_ids', {'in': 0}), + ('cast_segment_ids', 'embedding_segments_sum', {'in': 2, 'out': 0}), ('input_values', 'embedding_segments_sum', {'in': 1}), ('input_dense_shape', 'split_for_dense_shape', {'in': 0}), ('split_for_dense_shape_axis', 'split_for_dense_shape', {'in': 1}), From c03fc6b52bf96ee5c3f3dfe8f8c366fb79c37d85 Mon Sep 17 00:00:00 2001 From: Roman Kazantsev Date: Wed, 3 Jun 2020 18:53:57 +0500 Subject: [PATCH 21/31] Update BOM with RemoveConstToResult transform Signed-off-by: Roman Kazantsev --- model-optimizer/automation/package_BOM.txt | 1 + 1 file changed, 1 insertion(+) diff --git a/model-optimizer/automation/package_BOM.txt b/model-optimizer/automation/package_BOM.txt index a2f5b486314398..5710991733a102 100644 --- a/model-optimizer/automation/package_BOM.txt +++ b/model-optimizer/automation/package_BOM.txt @@ -52,6 +52,7 @@ extensions/back/ReadValueAssignToMemory.py extensions/back/ReduceToPooling.py extensions/back/ReduceTransposeDimensions.py extensions/back/remove_last_softmax_pattern.py +extensions/back/RemoveConstToResult.py extensions/back/RemoveUselessConvert.py extensions/back/Reshape0DToSqueeze.py extensions/back/ReshapeMutation.py From fbf745f438f69d47dd049426409d31cbe8781da8 Mon Sep 17 00:00:00 2001 From: Roman Kazantsev Date: Thu, 4 Jun 2020 10:01:18 +0500 Subject: [PATCH 22/31] Add more comments for RemoveConstToResult transformation Signed-off-by: Roman Kazantsev --- model-optimizer/extensions/back/RemoveConstToResult.py | 8 +++----- 1 file changed, 3 insertions(+), 5 deletions(-) diff --git a/model-optimizer/extensions/back/RemoveConstToResult.py b/model-optimizer/extensions/back/RemoveConstToResult.py index 84324b439af403..21bbc567e407cf 100644 --- a/model-optimizer/extensions/back/RemoveConstToResult.py +++ b/model-optimizer/extensions/back/RemoveConstToResult.py @@ -13,19 +13,17 @@ See the License for the specific language governing permissions and limitations under the License. """ -import logging as log - from mo.back.replacement import BackReplacementPattern from mo.graph.graph import Graph class RemoveConstToResult(BackReplacementPattern): """ - Transformation looks for a sub-graph "Const->Result" - and removes Result node. + Transformation looks for a sub-graph "Const->Result" and removes Result node. + Currently IE is unable to handle such graph so this transformation removes to work around this case. + For instance, this case appears for Wide and Deep model. """ enabled = True - #force_clean_up = True @staticmethod def pattern(): From 1ba3ccca8fd32214c1dbb4ae9f754be01a915b60 Mon Sep 17 00:00:00 2001 From: Roman Kazantsev Date: Thu, 4 Jun 2020 23:04:58 +0500 Subject: [PATCH 23/31] Remove useless logging in EmbeddingSegmentsSum transformation Signed-off-by: Roman Kazantsev --- model-optimizer/extensions/front/tf/embedding_segments_sum.py | 2 -- 1 file changed, 2 deletions(-) diff --git a/model-optimizer/extensions/front/tf/embedding_segments_sum.py b/model-optimizer/extensions/front/tf/embedding_segments_sum.py index f15b643654e5f9..b033ae7cd2cbbe 100644 --- a/model-optimizer/extensions/front/tf/embedding_segments_sum.py +++ b/model-optimizer/extensions/front/tf/embedding_segments_sum.py @@ -36,7 +36,6 @@ class EmbeddingSegmentsSumFrontReplacer(FrontReplacementSubgraph): enabled = True def pattern(self): - log.debug('Enabled EmbeddingSegmentsSum replacement') return dict( nodes=[ ('identity_spw', dict(op='Identity')), @@ -142,7 +141,6 @@ class EmbeddingSegmentsSumFrontReplacer2(FrontReplacementSubgraph): enabled = True def pattern(self): - log.debug('Enabled EmbeddingSegmentsSum2 replacement') return dict( nodes=[ ('identity_spw', dict(op='Identity')), From 47fc039d33fe41aa8f10e6d9bd2fc3ecd45cbbcc Mon Sep 17 00:00:00 2001 From: "Maxim, Vafin" Date: Fri, 5 Jun 2020 10:06:16 +0300 Subject: [PATCH 24/31] Small fixes --- model-optimizer/extensions/front/ATenToEmbeddingBag.py | 8 ++++---- model-optimizer/extensions/middle/EmbeddingBagResolver.py | 2 +- 2 files changed, 5 insertions(+), 5 deletions(-) diff --git a/model-optimizer/extensions/front/ATenToEmbeddingBag.py b/model-optimizer/extensions/front/ATenToEmbeddingBag.py index 769dc669ac6b04..6ff4d52a82dad5 100644 --- a/model-optimizer/extensions/front/ATenToEmbeddingBag.py +++ b/model-optimizer/extensions/front/ATenToEmbeddingBag.py @@ -27,14 +27,14 @@ class AtenToEmbeddingBag(FrontReplacementPattern): def find_and_replace_pattern(self, graph: Graph): for node in graph.get_op_nodes(op='ATen', operator='embedding_bag'): - node_name = node.name + node_name = node.soft_get('name', node.id) rename_node(node, node_name + '/TBR') embedding_bag = ATenEmbeddingBag(graph, {'name': node_name, 'mode': node.soft_get('mode', 1)}).create_node() rename_node(embedding_bag, node_name) node.in_port(0).get_connection().set_destination(embedding_bag.in_port(0)) node.in_port(1).get_connection().set_destination(embedding_bag.in_port(1)) - if node.has_port('in', 2) and not node.in_port(2).disconnected(): + if node.is_in_port_connected(2): node.in_port(2).get_connection().set_destination(embedding_bag.in_port(2)) - if node.has_port('in', 3) and not node.in_port(3).disconnected(): - node.in_port(2).get_connection().set_destination(embedding_bag.in_port(3)) + if node.is_in_port_connected(3): + node.in_port(3).get_connection().set_destination(embedding_bag.in_port(3)) node.out_port(0).get_connection().set_source(embedding_bag.out_port(0)) diff --git a/model-optimizer/extensions/middle/EmbeddingBagResolver.py b/model-optimizer/extensions/middle/EmbeddingBagResolver.py index f92c5f60ff96f4..67e4418095a72b 100644 --- a/model-optimizer/extensions/middle/EmbeddingBagResolver.py +++ b/model-optimizer/extensions/middle/EmbeddingBagResolver.py @@ -35,7 +35,7 @@ def find_and_replace_pattern(self, graph: Graph): for node in graph.get_op_nodes(op='ATenEmbeddingBag'): assert node.soft_get('mode') == 0, 'ATen::embedding_bag has unsupported mode, only "sum" ' \ 'mode is supported for node {}.'.format(node.id) - node_name = node.name + node_name = node.soft_get('name', node.id) rename_node(node, node_name + '/TBR') is_packed = False if len(node.in_ports()) < 3 or node.in_port(2).disconnected(): From 4da1a3024b8e81b7134decc6b759013c48d7da90 Mon Sep 17 00:00:00 2001 From: "Maxim, Vafin" Date: Fri, 5 Jun 2020 15:24:16 +0300 Subject: [PATCH 25/31] Move EmbeddingBag resolving back to front phase --- model-optimizer/automation/package_BOM.txt | 1 - .../extensions/front/ATenToEmbeddingBag.py | 59 ++++++- .../front/ATenToEmbeddingBag_test.py | 163 ++++++++++++++---- .../extensions/middle/EmbeddingBagResolver.py | 69 -------- .../middle/EmbeddingBagResolver_test.py | 133 -------------- .../extensions/ops/embedding_bag.py | 26 +-- 6 files changed, 188 insertions(+), 263 deletions(-) delete mode 100644 model-optimizer/extensions/middle/EmbeddingBagResolver.py delete mode 100644 model-optimizer/extensions/middle/EmbeddingBagResolver_test.py diff --git a/model-optimizer/automation/package_BOM.txt b/model-optimizer/automation/package_BOM.txt index aaf8ce75f45a0f..630ef2abe1f1cd 100644 --- a/model-optimizer/automation/package_BOM.txt +++ b/model-optimizer/automation/package_BOM.txt @@ -520,7 +520,6 @@ extensions/middle/DilatedConvolution.py extensions/middle/EltwiseChecker.py extensions/middle/EltwiseInputNormalization.py extensions/middle/EltwiseInputReshape.py -extensions/middle/EmbeddingBagResolver.py extensions/middle/FakeSplitOutputs.py extensions/middle/FusedBatchNormNonConstant.py extensions/middle/FusedBatchNormTraining.py diff --git a/model-optimizer/extensions/front/ATenToEmbeddingBag.py b/model-optimizer/extensions/front/ATenToEmbeddingBag.py index 6ff4d52a82dad5..8da70dc5c0d164 100644 --- a/model-optimizer/extensions/front/ATenToEmbeddingBag.py +++ b/model-optimizer/extensions/front/ATenToEmbeddingBag.py @@ -14,9 +14,18 @@ limitations under the License. """ -from extensions.ops.embedding_bag import ATenEmbeddingBag +from extensions.ops.embedding_bag import EmbeddingBagOffsetsSum, EmbeddingBagPackedSum +from extensions.ops.rank import Rank +from mo.front.common.partial_infer.utils import int64_array from mo.front.common.replacement import FrontReplacementPattern +from mo.front.tf.graph_utils import create_op_with_const_inputs from mo.graph.graph import Graph, rename_node +from mo.ops.broadcast import Broadcast +from mo.ops.concat import Concat +from mo.ops.shape import Shape +from mo.ops.unsqueeze import Unsqueeze +from mo.utils.shape import node_to_get_shape_value_of_indices, get_canonical_axis_index_node, \ + get_shape_values_by_indices_node class AtenToEmbeddingBag(FrontReplacementPattern): @@ -27,14 +36,52 @@ class AtenToEmbeddingBag(FrontReplacementPattern): def find_and_replace_pattern(self, graph: Graph): for node in graph.get_op_nodes(op='ATen', operator='embedding_bag'): + assert node.soft_get('mode') == 0, 'ATen::embedding_bag has unsupported mode, only "sum" ' \ + 'mode is supported for node {}.'.format(node.id) node_name = node.soft_get('name', node.id) rename_node(node, node_name + '/TBR') - embedding_bag = ATenEmbeddingBag(graph, {'name': node_name, 'mode': node.soft_get('mode', 1)}).create_node() + is_packed = False + if len(node.in_ports()) < 3 or node.in_port(2).disconnected(): + is_packed = True + embedding_bag = EmbeddingBagPackedSum(graph, {'name': node_name}).create_node() + else: + embedding_bag = EmbeddingBagOffsetsSum(graph, {'name': node_name}).create_node() + node.in_port(2).get_connection().set_destination(embedding_bag.in_port(2)) rename_node(embedding_bag, node_name) node.in_port(0).get_connection().set_destination(embedding_bag.in_port(0)) node.in_port(1).get_connection().set_destination(embedding_bag.in_port(1)) - if node.is_in_port_connected(2): - node.in_port(2).get_connection().set_destination(embedding_bag.in_port(2)) - if node.is_in_port_connected(3): - node.in_port(3).get_connection().set_destination(embedding_bag.in_port(3)) node.out_port(0).get_connection().set_source(embedding_bag.out_port(0)) + if len(node.in_ports()) == 4 and not node.in_port(3).disconnected(): + if is_packed: + node.in_port(3).get_connection().set_destination(embedding_bag.in_port(2)) + else: + # connect per_sample_weights + node.in_port(3).get_connection().set_destination(embedding_bag.in_port(4)) + + weights_shape_node = Shape(graph, {'name': node_name + '/WeightsShape'}).create_node() + + weights_rank_node = Rank(graph, {'name': node_name + '/WeightsRank'}).create_node() + last_dim_node = get_canonical_axis_index_node(weights_rank_node, -1) + weights_last_dim = get_shape_values_by_indices_node(weights_shape_node, last_dim_node) + + weights_first_dim = node_to_get_shape_value_of_indices(weights_shape_node, [0]) + + zero_col_node = create_op_with_const_inputs(graph, Broadcast, {0: int64_array([0])}, + {'name': node_name + '/Broadcast'}) + zero_col_node.in_port(1).connect(weights_last_dim.out_port(0)) + + default_embeddings_node = create_op_with_const_inputs(graph, Unsqueeze, {1: int64_array(0)}, + {'name': node_name + '/Unsqueeze'}) + default_embeddings_node.in_port(0).connect(zero_col_node.out_port(0)) + + # expand embedding table with zeros + weights_concat = Concat(graph, {'axis': 0, 'in_ports_count': 2, + 'name': node_name + '/Concat'}).create_node() + embedding_bag.in_port(0).get_connection().set_destination(weights_concat.in_port(0)) + weights_concat.in_port(0).get_connection().add_destination(weights_shape_node.in_port(0)) + weights_concat.in_port(0).get_connection().add_destination(weights_rank_node.in_port(0)) + weights_concat.in_port(1).connect(default_embeddings_node.out_port(0)) + weights_concat.out_port(0).connect(embedding_bag.in_port(0)) + + # point default index to expanded part of embedding table + weights_first_dim.out_port(0).connect(embedding_bag.in_port(3)) diff --git a/model-optimizer/extensions/front/ATenToEmbeddingBag_test.py b/model-optimizer/extensions/front/ATenToEmbeddingBag_test.py index 9783c7cd08cb35..bade2da38dbc9d 100644 --- a/model-optimizer/extensions/front/ATenToEmbeddingBag_test.py +++ b/model-optimizer/extensions/front/ATenToEmbeddingBag_test.py @@ -16,46 +16,147 @@ import unittest +import numpy as np + from extensions.front.ATenToEmbeddingBag import AtenToEmbeddingBag +from mo.front.common.partial_infer.utils import int64_array from mo.utils.ir_engine.compare_graphs import compare_graphs -from mo.utils.unittest.graph import build_graph - -nodes_attributes = { - 'weights_inp': {'shape': None, 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, - 'indices_inp': {'shape': None, 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, - 'offsets_inp': {'shape': None, 'type': 'Parameter', 'kind': 'op', 'op': 'Parameter'}, - 'aten': {'type': None, 'kind': 'op', 'op': 'ATen', 'mode': 0, 'operator': 'embedding_bag', 'name': 'my_aten'}, - 'result': {'type': 'Result', 'value': None, 'kind': 'op', 'op': 'Result'}, - - # new EmbeddingBag layer - 'emb_bag': {'type': None, 'kind': 'op', 'op': 'ATenEmbeddingBag', 'mode': 0}, -} +from mo.utils.unittest.graph import build_graph, result, \ + regular_op, const class AtenToEmbeddingBagTest(unittest.TestCase): def test(self): - graph = build_graph(nodes_attributes, - [('weights_inp', 'aten', {'in': 0, 'out': 0}), - ('indices_inp', 'aten', {'in': 1, 'out': 0}), - ('offsets_inp', 'aten', {'in': 2, 'out': 0}), - ('aten', 'result', {'in': 0, 'out': 0}), - ], - {}, nodes_with_edges_only=True) - - graph_ref = build_graph(nodes_attributes, - [('weights_inp', 'emb_bag', {'in': 0, 'out': 0}), - ('indices_inp', 'emb_bag', {'in': 1, 'out': 0}), - ('offsets_inp', 'emb_bag', {'in': 2, 'out': 0}), - ('emb_bag', 'result', {'in': 0, 'out': 0}), - ], - {}, nodes_with_edges_only=True) + nodes = { + **const('weights_inp', np.random.randn(100, 2)), + **regular_op('indices_inp', {'type': 'Parameter'}), + **regular_op('offsets_inp', {'type': 'Parameter'}), + **regular_op('aten', {'type': None, 'kind': 'op', 'op': 'ATen', 'operator': 'embedding_bag', 'mode': 0, + 'name': 'my_aten'}), + + **regular_op('emb_bag', {'type': 'EmbeddingBagOffsetsSum', 'kind': 'op', 'op': 'EmbeddingBagOffsetsSum'}), + **result('result'), + } + edges = [('weights_inp', 'aten'), + ('indices_inp', 'aten'), + ('offsets_inp', 'aten'), + ('aten', 'result'), + ] + graph = build_graph(nodes, edges) + + graph.graph['layout'] = 'NCHW' + graph.stage = 'front' + + edges_ref = [('weights_inp', 'emb_bag'), + ('indices_inp', 'emb_bag'), + ('offsets_inp', 'emb_bag'), + ('emb_bag', 'result'), + ] + + graph_ref = build_graph(nodes, edges_ref) + + AtenToEmbeddingBag().find_and_replace_pattern(graph) + + (flag, resp) = compare_graphs(graph, graph_ref, 'result') + self.assertTrue(flag, resp) + + def test_packed(self): + nodes = { + **const('weights_inp', np.random.randn(100, 4)), + **regular_op('indices_inp', {'type': 'Parameter'}), + **regular_op('aten', {'type': None, 'kind': 'op', 'op': 'ATen', 'operator': 'embedding_bag', 'mode': 0, + 'name': 'my_aten'}), + + **regular_op('emb_bag', {'type': 'EmbeddingBagPackedSum', 'kind': 'op', + 'op': 'EmbeddingBagPackedSum'}), + **result('result'), + } + edges = [('weights_inp', 'aten'), + ('indices_inp', 'aten'), + ('aten', 'result'), + ] + graph = build_graph(nodes, edges) graph.graph['layout'] = 'NCHW' graph.stage = 'front' - replacer = AtenToEmbeddingBag() - replacer.find_and_replace_pattern(graph) + edges_ref = [('weights_inp', 'emb_bag'), + ('indices_inp', 'emb_bag'), + ('emb_bag', 'result'), + ] + + graph_ref = build_graph(nodes, edges_ref) + + AtenToEmbeddingBag().find_and_replace_pattern(graph) + + (flag, resp) = compare_graphs(graph, graph_ref, 'result') + self.assertTrue(flag, resp) + + def test_per_sample_weights(self): + nodes = { + **const('weights_inp', np.random.randn(100, 2)), + **regular_op('indices_inp', {'type': 'Parameter'}), + **regular_op('offsets_inp', {'type': 'Parameter'}), + **regular_op('per_sample_weights', {'type': 'Parameter'}), + **regular_op('aten', {'type': None, 'kind': 'op', 'op': 'ATen', 'operator': 'embedding_bag', 'mode': 0, + 'name': 'my_aten'}), + + **regular_op('emb_bag', {'type': 'EmbeddingBagOffsetsSum', 'kind': 'op', + 'op': 'EmbeddingBagOffsetsSum'}), + **regular_op('WeightsRank', {'type': None, 'kind': 'op', 'op': 'Rank'}), + **regular_op('WeightsRank/axis', {'type': 'Add', 'kind': 'op', 'op': 'Add'}), + **regular_op('gather1', {'type': 'Gather', 'kind': 'op', 'op': 'Gather'}), + **regular_op('gather2', {'type': 'Gather', 'kind': 'op', 'op': 'Gather'}), + **regular_op('WeightsShape', {'type': 'ShapeOf', 'kind': 'op', 'op': 'ShapeOf'}), + **regular_op('Broadcast', {'type': 'Broadcast', 'kind': 'op', 'op': 'Broadcast'}), + **regular_op('Unsqueeze', {'type': 'Unsqueeze', 'kind': 'op', 'op': 'Unsqueeze'}), + **const('WeightsShape/Axis', int64_array(0)), + **const('zero1', int64_array(0)), + **const('zero2', int64_array(0)), + **const('Unsqueeze/value', int64_array(0)), + **const('Broadcast/value', int64_array(0)), + **const('neg', int64_array(-1)), + **regular_op('Concat', {'type': 'Concat', 'kind': 'op', 'op': 'Concat'}), + **result('result'), + } + edges = [('weights_inp', 'aten'), + ('indices_inp', 'aten'), + ('offsets_inp', 'aten'), + ('per_sample_weights', 'aten'), + ('aten', 'result'), + ] + graph = build_graph(nodes, edges, nodes_with_edges_only=True) + + graph.graph['layout'] = 'NCHW' + graph.stage = 'front' + + edges_ref = [('weights_inp', 'Concat', {'in': 0, 'out': 0}), + ('weights_inp', 'WeightsShape', {'in': 0, 'out': 0}), + ('weights_inp', 'WeightsRank', {'in': 0, 'out': 0}), + ('WeightsRank', 'WeightsRank/axis'), + ('neg', 'WeightsRank/axis'), + ('WeightsShape', 'gather1', {'in': 0, 'out': 0}), + ('WeightsRank/axis', 'gather1'), + ('WeightsShape/Axis', 'gather1'), + ('WeightsShape', 'gather2', {'in': 0, 'out': 0}), + ('zero1', 'gather2'), + ('zero2', 'gather2'), + ('Broadcast/value', 'Broadcast'), + ('gather1', 'Broadcast'), + ('Broadcast', 'Unsqueeze'), + ('Unsqueeze/value', 'Unsqueeze'), + ('Unsqueeze', 'Concat'), + ('Concat', 'emb_bag'), + ('indices_inp', 'emb_bag'), + ('offsets_inp', 'emb_bag'), + ('gather2', 'emb_bag'), + ('per_sample_weights', 'emb_bag'), + ('emb_bag', 'result'), + ] + + graph_ref = build_graph(nodes, edges_ref, nodes_with_edges_only=True) + + AtenToEmbeddingBag().find_and_replace_pattern(graph) - (flag, resp) = compare_graphs(graph, graph_ref, 'result', check_op_attrs=True) + (flag, resp) = compare_graphs(graph, graph_ref, 'result') self.assertTrue(flag, resp) - self.assertTrue(graph.node[graph.get_nodes_with_attributes(op='ATenEmbeddingBag')[0]]['name'] == 'my_aten') diff --git a/model-optimizer/extensions/middle/EmbeddingBagResolver.py b/model-optimizer/extensions/middle/EmbeddingBagResolver.py deleted file mode 100644 index 67e4418095a72b..00000000000000 --- a/model-optimizer/extensions/middle/EmbeddingBagResolver.py +++ /dev/null @@ -1,69 +0,0 @@ -""" - Copyright (C) 2018-2020 Intel Corporation - - Licensed under the Apache License, Version 2.0 (the "License"); - you may not use this file except in compliance with the License. - You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - - Unless required by applicable law or agreed to in writing, software - distributed under the License is distributed on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - See the License for the specific language governing permissions and - limitations under the License. -""" - -import numpy as np - -from extensions.ops.embedding_bag import EmbeddingBagOffsetsSum, EmbeddingBagPackedSum -from mo.front.common.partial_infer.utils import int64_array -from mo.front.tf.graph_utils import create_op_with_const_inputs -from mo.graph.graph import Graph, rename_node -from mo.middle.replacement import MiddleReplacementPattern -from mo.ops.concat import Concat -from mo.ops.const import Const - - -class EmbeddingBagResolver(MiddleReplacementPattern): - """ - Converts the ATenEmbeddingBag layer to correct internal EmbeddingBag layer. - """ - enabled = True - - def find_and_replace_pattern(self, graph: Graph): - for node in graph.get_op_nodes(op='ATenEmbeddingBag'): - assert node.soft_get('mode') == 0, 'ATen::embedding_bag has unsupported mode, only "sum" ' \ - 'mode is supported for node {}.'.format(node.id) - node_name = node.soft_get('name', node.id) - rename_node(node, node_name + '/TBR') - is_packed = False - if len(node.in_ports()) < 3 or node.in_port(2).disconnected(): - is_packed = True - embedding_bag = EmbeddingBagPackedSum(graph, {'name': node_name}).create_node() - else: - embedding_bag = EmbeddingBagOffsetsSum(graph, {'name': node_name}).create_node() - node.in_port(2).get_connection().set_destination(embedding_bag.in_port(2)) - rename_node(embedding_bag, node_name) - node.in_port(0).get_connection().set_destination(embedding_bag.in_port(0)) - node.in_port(1).get_connection().set_destination(embedding_bag.in_port(1)) - node.out_port(0).get_connection().set_source(embedding_bag.out_port(0)) - if len(node.in_ports()) == 4 and not node.in_port(3).disconnected(): - if is_packed: - node.in_port(3).get_connection().set_destination(embedding_bag.in_port(2)) - else: - # connect per_sample_weights - node.in_port(3).get_connection().set_destination(embedding_bag.in_port(4)) - - weights_shape = embedding_bag.in_port(0).data.get_shape() - - # expand embedding table with zeros - default_embeddings = np.zeros([1, weights_shape[-1]]) - weights_concat = create_op_with_const_inputs(graph, Concat, {1: default_embeddings}, - {'axis': 0, 'in_ports_count': 2}) - embedding_bag.in_port(0).get_connection().set_destination(weights_concat.in_port(0)) - weights_concat.out_port(0).connect(embedding_bag.in_port(0)) - - # point default index to expanded part of embedding table - default_index = Const(graph, {'value': int64_array(weights_shape[0])}).create_node() - default_index.out_port(0).connect(embedding_bag.in_port(3)) diff --git a/model-optimizer/extensions/middle/EmbeddingBagResolver_test.py b/model-optimizer/extensions/middle/EmbeddingBagResolver_test.py deleted file mode 100644 index d964da69ccd1e0..00000000000000 --- a/model-optimizer/extensions/middle/EmbeddingBagResolver_test.py +++ /dev/null @@ -1,133 +0,0 @@ -""" - Copyright (C) 2020 Intel Corporation - - Licensed under the Apache License, Version 2.0 (the "License"); - you may not use this file except in compliance with the License. - You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - - Unless required by applicable law or agreed to in writing, software - distributed under the License is distributed on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - See the License for the specific language governing permissions and - limitations under the License. -""" - -import unittest - -import numpy as np - -from extensions.middle.EmbeddingBagResolver import EmbeddingBagResolver -from mo.front.common.partial_infer.utils import int64_array -from mo.utils.ir_engine.compare_graphs import compare_graphs -from mo.utils.unittest.graph import build_graph, regular_op_with_shaped_data, valued_const_with_data, result, \ - connect - - -class AtenToEmbeddingBagTest(unittest.TestCase): - def test(self): - nodes = { - **valued_const_with_data('weights_inp', np.random.randn(100, 2)), - **regular_op_with_shaped_data('indices_inp', [20], {'type': 'Parameter'}), - **regular_op_with_shaped_data('offsets_inp', [10], {'type': 'Parameter'}), - **regular_op_with_shaped_data('aten', [10, 2], - {'type': None, 'kind': 'op', 'op': 'ATenEmbeddingBag', 'mode': 0, - 'name': 'my_aten'}), - - **regular_op_with_shaped_data('emb_bag', [10, 2], {'type': 'EmbeddingBagOffsetsSum', 'kind': 'op', - 'op': 'EmbeddingBagOffsetsSum'}), - **result('result'), - } - edges = [*connect('weights_inp', '0:aten'), - *connect('indices_inp', '1:aten'), - *connect('offsets_inp', '2:aten'), - *connect('aten', 'result'), - ] - graph = build_graph(nodes, edges) - - edges_ref = [*connect('weights_inp', '0:emb_bag'), - *connect('indices_inp', '1:emb_bag'), - *connect('offsets_inp', '2:emb_bag'), - *connect('emb_bag', 'result'), - ] - - graph_ref = build_graph(nodes, edges_ref) - - EmbeddingBagResolver().find_and_replace_pattern(graph) - - (flag, resp) = compare_graphs(graph, graph_ref, 'result') - self.assertTrue(flag, resp) - - def test_packed(self): - nodes = { - **valued_const_with_data('weights_inp', np.random.randn(100, 4)), - **regular_op_with_shaped_data('indices_inp', [10, 2], {'type': 'Parameter'}), - **regular_op_with_shaped_data('aten', [10, 4], - {'type': None, 'kind': 'op', 'op': 'ATenEmbeddingBag', 'mode': 0, - 'name': 'my_aten'}), - - **regular_op_with_shaped_data('emb_bag', [10, 4], {'type': 'EmbeddingBagPackedSum', 'kind': 'op', - 'op': 'EmbeddingBagPackedSum'}), - **result('result'), - } - edges = [*connect('weights_inp', '0:aten'), - *connect('indices_inp', '1:aten'), - *connect('aten', 'result'), - ] - graph = build_graph(nodes, edges) - - edges_ref = [*connect('weights_inp', '0:emb_bag'), - *connect('indices_inp', '1:emb_bag'), - *connect('emb_bag', 'result'), - ] - - graph_ref = build_graph(nodes, edges_ref) - - EmbeddingBagResolver().find_and_replace_pattern(graph) - - (flag, resp) = compare_graphs(graph, graph_ref, 'result') - self.assertTrue(flag, resp) - - def test_per_sample_weights(self): - nodes = { - **valued_const_with_data('weights_inp', np.random.randn(100, 2)), - **regular_op_with_shaped_data('indices_inp', [20], {'type': 'Parameter'}), - **regular_op_with_shaped_data('offsets_inp', [10], {'type': 'Parameter'}), - **regular_op_with_shaped_data('per_sample_weights', [20], {'type': 'Parameter'}), - **regular_op_with_shaped_data('aten', [10, 2], - {'type': None, 'kind': 'op', 'op': 'ATenEmbeddingBag', 'mode': 0, - 'name': 'my_aten'}), - - **regular_op_with_shaped_data('emb_bag', [10, 2], {'type': 'EmbeddingBagOffsetsSum', 'kind': 'op', - 'op': 'EmbeddingBagOffsetsSum'}), - **valued_const_with_data('zeros', np.zeros([1, 2])), - **regular_op_with_shaped_data('concat', None, {'type': 'Concat', 'kind': 'op', 'op': 'Concat'}), - 'def_index': {'kind': 'op', 'value': int64_array(100), 'shape': None, 'type': 'Const'}, - 'def_index_d': {'kind': 'data', 'value': None, 'shape': None}, - **result('result'), - } - edges = [*connect('weights_inp', '0:aten'), - *connect('indices_inp', '1:aten'), - *connect('offsets_inp', '2:aten'), - *connect('per_sample_weights', '3:aten'), - *connect('aten', 'result'), - ] - graph = build_graph(nodes, edges) - - edges_ref = [*connect('weights_inp', '0:concat'), - *connect('zeros', '1:concat'), - *connect('concat', '0:emb_bag'), - *connect('indices_inp', '1:emb_bag'), - *connect('offsets_inp', '2:emb_bag'), - *connect('def_index', '3:emb_bag'), - *connect('per_sample_weights', '4:emb_bag'), - *connect('emb_bag', 'result'), - ] - - graph_ref = build_graph(nodes, edges_ref) - - EmbeddingBagResolver().find_and_replace_pattern(graph) - - (flag, resp) = compare_graphs(graph, graph_ref, 'result') - self.assertTrue(flag, resp) diff --git a/model-optimizer/extensions/ops/embedding_bag.py b/model-optimizer/extensions/ops/embedding_bag.py index fc13dde08ae060..b65b039aaa23ac 100644 --- a/model-optimizer/extensions/ops/embedding_bag.py +++ b/model-optimizer/extensions/ops/embedding_bag.py @@ -65,7 +65,7 @@ def infer(node: Node): offsets_shape = node.in_port(2).data.get_shape() assert offsets_shape is not None and len(offsets_shape) == 1 - node.out_port(0).data.set_shape(np.concatenate((offsets_shape[:1], weights_shape[1:])).astype(np.int64)) + node.out_port(0).data.set_shape(np.concatenate((offsets_shape[:1], weights_shape[1:]))) class EmbeddingBagPackedSum(EmbeddingBagBase): @@ -87,7 +87,7 @@ def infer(node: Node): input_shape = node.in_port(1).data.get_shape() assert input_shape is not None - node.out_port(0).data.set_shape(np.concatenate((input_shape[:1], weights_shape[1:])).astype(np.int64)) + node.out_port(0).data.set_shape(np.concatenate((input_shape[:1], weights_shape[1:]))) class EmbeddingSegmentsSum(EmbeddingBagBase): @@ -113,25 +113,5 @@ def infer(node: Node): num_segments = node.in_port(3).data.get_value() assert num_segments is not None, "EmbeddingSegmentsSum should have a constant num_segments provided, but it " \ "doesn't for node: `{}`.".format(name) - output_shape = np.concatenate(([num_segments], weights_shape[1:])).astype(np.int64) + output_shape = np.concatenate(([num_segments], weights_shape[1:])) node.out_port(0).data.set_shape(output_shape) - - -class ATenEmbeddingBag(EmbeddingBagBase): - op = 'ATenEmbeddingBag' - op_type = None - version = None - in_ports_count = 4 - - @staticmethod - def infer(node: Node): - weights_shape = node.in_port(0).data.get_shape() - assert len(weights_shape) >= 2 - indices_shape = node.in_port(1).data.get_shape() - assert indices_shape is not None - if len(indices_shape) == 2: - node.out_port(0).data.set_shape(np.concatenate((indices_shape[:1], weights_shape[1:])).astype(np.int64)) - elif len(indices_shape) == 1: - offsets_shape = node.in_port(2).data.get_shape() - assert offsets_shape is not None and len(offsets_shape) == 1 - node.out_port(0).data.set_shape(np.concatenate((offsets_shape[:1], weights_shape[1:])).astype(np.int64)) From a296137724bce4c7a1b1578fcd0025c6a363ba05 Mon Sep 17 00:00:00 2001 From: "Maxim, Vafin" Date: Fri, 5 Jun 2020 15:55:36 +0300 Subject: [PATCH 26/31] Improve error messages --- .../extensions/ops/embedding_bag.py | 29 ++++++++++--------- 1 file changed, 15 insertions(+), 14 deletions(-) diff --git a/model-optimizer/extensions/ops/embedding_bag.py b/model-optimizer/extensions/ops/embedding_bag.py index b65b039aaa23ac..1d83db0a6375a3 100644 --- a/model-optimizer/extensions/ops/embedding_bag.py +++ b/model-optimizer/extensions/ops/embedding_bag.py @@ -54,16 +54,16 @@ def infer(node: Node): name = node.soft_get('name', node.id) connected_in_ports = {idx: port for idx, port in node.in_ports().items() if not port.disconnected()} - assert len(connected_in_ports) >= 3 and 0 in connected_in_ports and 1 in connected_in_ports and \ - 2 in connected_in_ports, "EmbeddingBag should have at least 3 connected input port, but it doesn't " \ - "for node: `{}`. Ports: {}".format(name, connected_in_ports) + assert len(connected_in_ports) >= 3 and all(p in connected_in_ports for p in [0, 1, 2]), \ + "EmbeddingBagOffsetsSum should have at least 3 connected input port, but it doesn't " \ + "for node: `{}`. Ports: {}".format(name, connected_in_ports) weights_shape = node.in_port(0).data.get_shape() - assert len(weights_shape) >= 2 - input_shape = node.in_port(1).data.get_shape() - assert input_shape is not None + assert len(weights_shape) >= 2,\ + "EmbeddingBagOffsetsSum should have at least 2D weights for node: `{}`".format(name) offsets_shape = node.in_port(2).data.get_shape() - assert offsets_shape is not None and len(offsets_shape) == 1 + assert offsets_shape is not None and len(offsets_shape) == 1,\ + "Rank of the offsets in EmbeddingBagOffsetsSum should be equal to 1 for node: `{}`".format(name) node.out_port(0).data.set_shape(np.concatenate((offsets_shape[:1], weights_shape[1:]))) @@ -78,14 +78,14 @@ def infer(node: Node): name = node.soft_get('name', node.id) connected_in_ports = {idx: port for idx, port in node.in_ports().items() if not port.disconnected()} - assert len(connected_in_ports) >= 2 and 0 in connected_in_ports and 1 in connected_in_ports, \ + assert len(connected_in_ports) >= 2 and all(p in connected_in_ports for p in [0, 1]), \ "EmbeddingBagPackedSum should have at least 2 connected input port, but it doesn't for node: `{}`. " \ "Ports: {}".format(name, connected_in_ports) weights_shape = node.in_port(0).data.get_shape() - assert len(weights_shape) >= 2 + assert len(weights_shape) >= 2, \ + "EmbeddingBagPackedSum should have at least 2D weights for node: `{}`".format(name) input_shape = node.in_port(1).data.get_shape() - assert input_shape is not None node.out_port(0).data.set_shape(np.concatenate((input_shape[:1], weights_shape[1:]))) @@ -100,16 +100,17 @@ def infer(node: Node): name = node.soft_get('name', node.id) connected_in_ports = {idx: port for idx, port in node.in_ports().items() if not port.disconnected()} - assert len(connected_in_ports) >= 4 and 0 in connected_in_ports and 1 in connected_in_ports and \ - 2 in connected_in_ports and 3 in connected_in_ports, \ + assert len(connected_in_ports) >= 4 and all(p in connected_in_ports for p in [0, 1, 2, 3]), \ "EmbeddingSegmentsSum should have at least 4 connected input port, but it doesn't for node: `{}`. " \ "Ports: {}".format(name, connected_in_ports) weights_shape = node.in_port(0).data.get_shape() - assert len(weights_shape) >= 2 + assert len(weights_shape) >= 2,\ + "EmbeddingSegmentsSum should have at least 2D weights for node: `{}`".format(name) indices_shape = node.in_port(1).data.get_shape() segment_ids = node.in_port(2).data.get_shape() - assert len(indices_shape) == 1 and len(segment_ids) == 1 and indices_shape == segment_ids + assert len(indices_shape) == 1 and len(segment_ids) == 1 and indices_shape == segment_ids,\ + "Both indices and segment_ids should have the same shape for node: `{}`".format(name) num_segments = node.in_port(3).data.get_value() assert num_segments is not None, "EmbeddingSegmentsSum should have a constant num_segments provided, but it " \ "doesn't for node: `{}`.".format(name) From 8df85b4f51597215efe4040d01a14c03f5814888 Mon Sep 17 00:00:00 2001 From: "Maxim, Vafin" Date: Fri, 5 Jun 2020 18:04:30 +0300 Subject: [PATCH 27/31] Fix typo in unittests --- model-optimizer/extensions/ops/embedding_bag_test.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/model-optimizer/extensions/ops/embedding_bag_test.py b/model-optimizer/extensions/ops/embedding_bag_test.py index 012dd7a1fd6709..beda49b9c88d74 100644 --- a/model-optimizer/extensions/ops/embedding_bag_test.py +++ b/model-optimizer/extensions/ops/embedding_bag_test.py @@ -52,17 +52,17 @@ class TestEmbeddingInfer(unittest.TestCase): def test_embedding_bag_offsets_sum(self): graph = build_graph(nodes, [ *connect('data', '0:embedding_bag_offsets'), - *connect('indices', '1:embedding_bag_offsets'), + *connect('indices1d', '1:embedding_bag_offsets'), *connect('offsets', '2:embedding_bag_offsets'), ('embedding_bag_offsets', 'embedding_bag_offsets_d', {'out': 0}), ('embedding_bag_offsets_d', 'output'), ], nodes_with_edges_only=True) - eb_node = Node(graph, 'embedding_bag') + eb_node = Node(graph, 'embedding_bag_offsets') EmbeddingBagOffsetsSum.infer(eb_node) self.assertTrue(np.array_equal(eb_node.out_port(0).data.get_shape(), int64_array([30, 8]))) - def test_embedding_bag_offsets_sum(self): + def test_embedding_bag_packed_sum(self): graph = build_graph(nodes, [ *connect('data', '0:embedding_bag_packed'), *connect('indices2d', '1:embedding_bag_packed'), From 71773aae007b05a92e334cb37663d46cf1ab94e8 Mon Sep 17 00:00:00 2001 From: Roman Kazantsev Date: Sun, 7 Jun 2020 22:58:01 +0500 Subject: [PATCH 28/31] Reimplement sparse_reshape middle transform Avoid deprecated API. Signed-off-by: Roman Kazantsev --- model-optimizer/automation/package_BOM.txt | 1 - .../extensions/back/RemoveConstToResult.py | 45 ------------------- .../back/SpecialNodesFinalization.py | 28 ++++++++++++ .../extensions/middle/sparse_reshape.py | 23 +++------- .../extensions/ops/sparse_reshape.py | 5 ++- 5 files changed, 37 insertions(+), 65 deletions(-) delete mode 100644 model-optimizer/extensions/back/RemoveConstToResult.py diff --git a/model-optimizer/automation/package_BOM.txt b/model-optimizer/automation/package_BOM.txt index 630ef2abe1f1cd..f2743f6195db10 100644 --- a/model-optimizer/automation/package_BOM.txt +++ b/model-optimizer/automation/package_BOM.txt @@ -52,7 +52,6 @@ extensions/back/ReadValueAssignToMemory.py extensions/back/ReduceToPooling.py extensions/back/ReduceTransposeDimensions.py extensions/back/remove_last_softmax_pattern.py -extensions/back/RemoveConstToResult.py extensions/back/RemoveUselessConvert.py extensions/back/Reshape0DToSqueeze.py extensions/back/ReshapeMutation.py diff --git a/model-optimizer/extensions/back/RemoveConstToResult.py b/model-optimizer/extensions/back/RemoveConstToResult.py deleted file mode 100644 index 21bbc567e407cf..00000000000000 --- a/model-optimizer/extensions/back/RemoveConstToResult.py +++ /dev/null @@ -1,45 +0,0 @@ -""" - Copyright (C) 2020 Intel Corporation - - Licensed under the Apache License, Version 2.0 (the "License"); - you may not use this file except in compliance with the License. - You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - - Unless required by applicable law or agreed to in writing, software - distributed under the License is distributed on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - See the License for the specific language governing permissions and - limitations under the License. -""" -from mo.back.replacement import BackReplacementPattern -from mo.graph.graph import Graph - - -class RemoveConstToResult(BackReplacementPattern): - """ - Transformation looks for a sub-graph "Const->Result" and removes Result node. - Currently IE is unable to handle such graph so this transformation removes to work around this case. - For instance, this case appears for Wide and Deep model. - """ - enabled = True - - @staticmethod - def pattern(): - return dict( - nodes=[ - ('const_node', {'type': 'Const', 'kind': 'op'}), - ('const_data', {'kind': 'data'}), - ('result_node', {'type': 'Result', 'kind': 'op'}), - ], - edges=[ - ('const_node', 'const_data'), - ('const_data', 'result_node') - ] - ) - - @staticmethod - def replace_pattern(graph: Graph, match: dict): - result_node = match['result_node'] - graph.remove_node(result_node.id) diff --git a/model-optimizer/extensions/back/SpecialNodesFinalization.py b/model-optimizer/extensions/back/SpecialNodesFinalization.py index 09422d3e8a9a73..99a88f2bcfc682 100644 --- a/model-optimizer/extensions/back/SpecialNodesFinalization.py +++ b/model-optimizer/extensions/back/SpecialNodesFinalization.py @@ -130,6 +130,34 @@ def find_and_replace_pattern(self, graph: Graph): graph.remove_node(node.id) +class RemoveConstToResult(BackReplacementPattern): + """ + Transformation looks for a sub-graph "Const->Result" and removes Result node. + Currently IE is unable to handle such graph so this transformation removes to work around this case. + For instance, this case appears for Wide and Deep model. + """ + enabled = True + + @staticmethod + def pattern(): + return dict( + nodes=[ + ('const_node', {'type': 'Const', 'kind': 'op'}), + ('const_data', {'kind': 'data'}), + ('result_node', {'type': 'Result', 'kind': 'op'}), + ], + edges=[ + ('const_node', 'const_data'), + ('const_data', 'result_node') + ] + ) + + @staticmethod + def replace_pattern(graph: Graph, match: dict): + result_node = match['result_node'] + graph.remove_node(result_node.id) + + class NormalizeTI(BackReplacementPattern): """ This transformation is used while generating IR of lower than 10 version diff --git a/model-optimizer/extensions/middle/sparse_reshape.py b/model-optimizer/extensions/middle/sparse_reshape.py index 3282049fd1292f..a44bab46111b19 100644 --- a/model-optimizer/extensions/middle/sparse_reshape.py +++ b/model-optimizer/extensions/middle/sparse_reshape.py @@ -59,23 +59,10 @@ def replace_pattern(self, graph: Graph, match: dict): if not np.array_equal(input_shape_value, output_shape_value): raise Error("Input shape and output shape values must be equal for node {}".format(sparse_reshape.id)) - input_data_node1 = sparse_reshape.in_node(0) - input_data_node2 = sparse_reshape.in_node(1) - graph.remove_edge(input_data_node1.id, sparse_reshape.id) - graph.remove_edge(input_data_node2.id, sparse_reshape.id) if 0 in sparse_reshape.out_nodes(): - output_data_node1 = sparse_reshape.out_node(0) - graph.remove_edge(sparse_reshape.id, output_data_node1.id) - merge_data_nodes(graph, output_data_node1, input_data_node1) + sparse_reshape.out_port(0).get_connection().set_source(sparse_reshape.in_port(0).get_source()) + if 1 in sparse_reshape.out_nodes(): - output_data_node2 = sparse_reshape.out_node(1) - graph.remove_edge(sparse_reshape.id, output_data_node2.id) - merge_data_nodes(graph, output_data_node2, input_data_node2) - graph.remove_nodes_from([sparse_reshape.id, input_data_node1.id, input_data_node2.id]) - - # TODO: investigate why this second way does not work - # sparse_reshape.out_port(0).get_connection().set_source(sparse_reshape.in_port(0).get_source()) - # sparse_reshape.out_port(1).get_connection().set_source(sparse_reshape.in_port(1).get_source()) - # sparse_reshape.in_port(0).get_connection().set_destination(sparse_reshape.in_port(0) - # sparse_reshape.in_port(2).disconnect() - # graph.remove_nodes_from([sparse_reshape.id]) + sparse_reshape.out_port(1).get_connection().set_source(sparse_reshape.in_port(1).get_source()) + + graph.remove_nodes_from([sparse_reshape.id]) diff --git a/model-optimizer/extensions/ops/sparse_reshape.py b/model-optimizer/extensions/ops/sparse_reshape.py index 2a2c75ce6c2d02..18c1d062af425f 100644 --- a/model-optimizer/extensions/ops/sparse_reshape.py +++ b/model-optimizer/extensions/ops/sparse_reshape.py @@ -42,6 +42,7 @@ def supported_attrs(self): @staticmethod def infer(node: Node): input_indices_shape = node.in_port(0).data.get_shape() + input_indices_value = node.in_port(0).data.get_value() input_shape_value = node.in_port(1).data.get_value() new_shape_value = node.in_port(2).data.get_value() new_shape_shape = node.in_port(2).data.get_shape() @@ -60,4 +61,6 @@ def infer(node: Node): output_indices_shape = np.concatenate((input_indices_shape[0:1], new_shape_shape)) node.out_port(0).data.set_shape(output_indices_shape) - # TODO: implement for constant input indices value + # TODO: implement constant value propogation for common case + if np.array_equal(input_shape_value, output_shape_value) and input_indices_value is not None: + node.out_port(0).data.set_value(input_indices_value) From 42b6441d29c3127bf382c2a8d799875ad03e84d2 Mon Sep 17 00:00:00 2001 From: Roman Kazantsev Date: Mon, 8 Jun 2020 17:32:31 +0500 Subject: [PATCH 29/31] Clean-up graph after sparse_reshape and ConstToResult transformation Signed-off-by: Roman Kazantsev --- .../extensions/back/SpecialNodesFinalization.py | 11 ++++++++++- model-optimizer/extensions/middle/sparse_reshape.py | 13 ++++++++++++- 2 files changed, 22 insertions(+), 2 deletions(-) diff --git a/model-optimizer/extensions/back/SpecialNodesFinalization.py b/model-optimizer/extensions/back/SpecialNodesFinalization.py index 99a88f2bcfc682..d972545807157c 100644 --- a/model-optimizer/extensions/back/SpecialNodesFinalization.py +++ b/model-optimizer/extensions/back/SpecialNodesFinalization.py @@ -154,8 +154,17 @@ def pattern(): @staticmethod def replace_pattern(graph: Graph, match: dict): + const_node = match['const_node'] + const_data_node = match['const_data'] result_node = match['result_node'] - graph.remove_node(result_node.id) + nodes_to_remove = [result_node.id] + + # in case only const data consumer that is the result node, remove the whole sub-graph + if len(const_data_node.out_nodes()) == 1: + nodes_to_remove.append(const_node.id) + nodes_to_remove.append(const_data_node.id) + + graph.remove_node(nodes_to_remove) class NormalizeTI(BackReplacementPattern): diff --git a/model-optimizer/extensions/middle/sparse_reshape.py b/model-optimizer/extensions/middle/sparse_reshape.py index a44bab46111b19..72e4174aa53e58 100644 --- a/model-optimizer/extensions/middle/sparse_reshape.py +++ b/model-optimizer/extensions/middle/sparse_reshape.py @@ -59,10 +59,21 @@ def replace_pattern(self, graph: Graph, match: dict): if not np.array_equal(input_shape_value, output_shape_value): raise Error("Input shape and output shape values must be equal for node {}".format(sparse_reshape.id)) + nodes_to_remove = [sparse_reshape.id] if 0 in sparse_reshape.out_nodes(): sparse_reshape.out_port(0).get_connection().set_source(sparse_reshape.in_port(0).get_source()) + output_data_node = sparse_reshape.out_node(0) + nodes_to_remove.append(output_data_node.id) + else: + input_data_node = sparse_reshape.in_node(0) + nodes_to_remove.append(input_data_node.id) if 1 in sparse_reshape.out_nodes(): sparse_reshape.out_port(1).get_connection().set_source(sparse_reshape.in_port(1).get_source()) + output_data_node = sparse_reshape.out_node(1) + nodes_to_remove.append(output_data_node.id) + else: + input_data_node = sparse_reshape.in_node(1) + nodes_to_remove.append(input_data_node.id) - graph.remove_nodes_from([sparse_reshape.id]) + graph.remove_nodes_from(nodes_to_remove) From 9b5e8dec11bb8aa088639f1811148a8e2ddde83a Mon Sep 17 00:00:00 2001 From: Roman Kazantsev Date: Mon, 8 Jun 2020 17:38:18 +0500 Subject: [PATCH 30/31] Fix clean-up for transformations Signed-off-by: Roman Kazantsev --- model-optimizer/extensions/back/SpecialNodesFinalization.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/model-optimizer/extensions/back/SpecialNodesFinalization.py b/model-optimizer/extensions/back/SpecialNodesFinalization.py index d972545807157c..020ef5f28865d4 100644 --- a/model-optimizer/extensions/back/SpecialNodesFinalization.py +++ b/model-optimizer/extensions/back/SpecialNodesFinalization.py @@ -160,7 +160,7 @@ def replace_pattern(graph: Graph, match: dict): nodes_to_remove = [result_node.id] # in case only const data consumer that is the result node, remove the whole sub-graph - if len(const_data_node.out_nodes()) == 1: + if len(const_node.out_port(0).get_destinations()) == 1: nodes_to_remove.append(const_node.id) nodes_to_remove.append(const_data_node.id) From 954bc6fedf128fce6dae80e20dd22ca86eabd9d1 Mon Sep 17 00:00:00 2001 From: Roman Kazantsev Date: Mon, 8 Jun 2020 17:43:32 +0500 Subject: [PATCH 31/31] Fix clean-up for transformation #2 Signed-off-by: Roman Kazantsev --- model-optimizer/extensions/middle/sparse_reshape.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/model-optimizer/extensions/middle/sparse_reshape.py b/model-optimizer/extensions/middle/sparse_reshape.py index 72e4174aa53e58..5db8b162dcd261 100644 --- a/model-optimizer/extensions/middle/sparse_reshape.py +++ b/model-optimizer/extensions/middle/sparse_reshape.py @@ -60,7 +60,7 @@ def replace_pattern(self, graph: Graph, match: dict): raise Error("Input shape and output shape values must be equal for node {}".format(sparse_reshape.id)) nodes_to_remove = [sparse_reshape.id] - if 0 in sparse_reshape.out_nodes(): + if sparse_reshape.is_out_port_connected(0): sparse_reshape.out_port(0).get_connection().set_source(sparse_reshape.in_port(0).get_source()) output_data_node = sparse_reshape.out_node(0) nodes_to_remove.append(output_data_node.id) @@ -68,7 +68,7 @@ def replace_pattern(self, graph: Graph, match: dict): input_data_node = sparse_reshape.in_node(0) nodes_to_remove.append(input_data_node.id) - if 1 in sparse_reshape.out_nodes(): + if sparse_reshape.is_out_port_connected(1): sparse_reshape.out_port(1).get_connection().set_source(sparse_reshape.in_port(1).get_source()) output_data_node = sparse_reshape.out_node(1) nodes_to_remove.append(output_data_node.id)