Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

[Frontend] Add NNEF frontend #17053

Open
wants to merge 8 commits into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
The table of contents is too big for display.
Diff view
Diff view
  •  
  •  
  •  
4 changes: 4 additions & 0 deletions docker/Dockerfile.ci_cpu
Original file line number Diff line number Diff line change
Expand Up @@ -150,6 +150,10 @@ RUN bash /install/ubuntu_install_libxsmm.sh
COPY install/ubuntu_install_onnx.sh /install/ubuntu_install_onnx.sh
RUN bash /install/ubuntu_install_onnx.sh

# NNEF
COPY install/ubuntu_install_nnef.sh /install/ubuntu_install_nnef.sh
RUN bash /install/ubuntu_install_nnef.sh

# AArch64 Architecture Envelope Model (AEM)
COPY install/ubuntu_install_aprofile_aem.sh /install
RUN bash /install/ubuntu_install_aprofile_aem.sh
Expand Down
5 changes: 4 additions & 1 deletion docker/Dockerfile.ci_gpu
Original file line number Diff line number Diff line change
Expand Up @@ -17,7 +17,7 @@

# CI docker GPU env
# tag: v0.60
FROM nvidia/cuda:12.4.1-cudnn-devel-ubuntu22.04
FROM nvidia/cuda:11.8.0-cudnn8-devel-ubuntu22.04

COPY utils/apt-install-and-clear.sh /usr/local/bin/apt-install-and-clear

Expand Down Expand Up @@ -118,6 +118,9 @@ RUN bash /install/ubuntu_install_paddle.sh
COPY install/ubuntu_install_oneflow.sh /install/ubuntu_install_oneflow.sh
RUN bash /install/ubuntu_install_oneflow.sh

COPY install/ubuntu_install_nnef.sh /install/ubuntu_install_nnef.sh
RUN bash /install/ubuntu_install_nnef.sh

# Rust env (build early; takes a while)
COPY install/ubuntu_install_rust.sh /install/ubuntu_install_rust.sh
RUN bash /install/ubuntu_install_rust.sh
Expand Down
25 changes: 25 additions & 0 deletions docker/install/ubuntu_install_nnef.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,25 @@
#!/bin/bash
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.

set -e
set -u
set -o pipefail

pip3 install \
nnef_tools==1.0.5 \
nnef==1.0.5
21 changes: 21 additions & 0 deletions python/tvm/relax/frontend/nnef/__init__.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,21 @@
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.

"""
NNEF frontend for converting graphs into Relax IRModels.
"""
from .nnef_frontend import from_nnef
307 changes: 307 additions & 0 deletions python/tvm/relax/frontend/nnef/nnef_frontend.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,307 @@
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.

"""NNEF: Neural Network Exchange Format frontend for TVM relay"""
agoston-mc marked this conversation as resolved.
Show resolved Hide resolved
import os
import typing
import nnef
import numpy as np

import tvm
from tvm import relax
from tvm.ir import IRModule
from tvm.relax import expr as tvm_expr

from .nnef_ops import _get_converter_map


def get_type(elem_type: str):
"""
Gives numpy style type for nnef primitive types, uses x32 versions.

:param elem_type: string, (scalar, integer, logical, string)
:return: returns numpy dtype equivalent (float32, int32, bool, string)
"""
if elem_type == "scalar":
return "float32"
if elem_type == "integer":
return "int32"
if elem_type == "logical":
return "bool"
if elem_type == "string":
return "string"
raise TypeError(f'Type "{elem_type}" is not implemented')


# Converter class
class NNEFConverter:
"""
Helper class for class level attributes, for conversion of NNEF model.
Public method to use is from_nnef.

Parameters
----------

keep_params_in_input : bool, optional
If this parameter is true, the nnef variables will be converted to
constants, and be embedded into the relay model, allowing optimizations
at compile time.
If False the params will have to be added as inputs,
the model can't load them automatically

"""

def __init__(self, keep_params_in_input=False):
self._nodes = {}
self._consts = {}
self._inputs = {}
self._num_inputs = 0
self._params = {}
self._num_params = 0
self._keep_params_in_input = keep_params_in_input
self._bb = relax.BlockBuilder()

def from_nnef(self, graph: nnef.Graph) -> tvm.IRModule:
"""
Convert an NNEF model into an equivalent TVM Relay IRModule.
agoston-mc marked this conversation as resolved.
Show resolved Hide resolved

Parameters
----------
graph : nnef.Graph
An NNEF Graph object that was imported with nnef.load_graph.
Shapes should be inferred by nnef.infer_shapes on graph beforehand.

Returns
-------
mod : tvm.IRModule
The relay module for compilation

params : dict of str to tvm.nd.NDArray
The parameter dictionary to be used

"""
with self._bb.function("main"):
with self._bb.dataflow():
self._parse_inputs(graph)
self._construct_nodes(graph)

outputs = [self._nodes[n] for n in graph.outputs]
outputs = outputs[0] if len(outputs) == 1 else tvm_expr.Tuple(outputs)

output_var = self._bb.emit_output(outputs)

func_attrs = {"num_input": self._num_inputs}

input_list = [value for value in self._inputs.values() if isinstance(value, relax.Var)]

if self._keep_params_in_input and self._params:
param_var_list, param_value_list = map(list, zip(*self._params.values()))
input_list.append(param_var_list)
func_attrs["params"] = param_value_list

self._bb.emit_func_output(output_var, input_list)

relax_mod = self._bb.get()
relax_mod["main"] = relax_mod["main"].with_attrs(func_attrs)
return relax_mod

def _parse_inputs(self, graph):
"""Save inputs into class from inputs attrib of graph"""
for inp in graph.inputs:
self._num_inputs += 1
tensor = graph.tensors[inp]
self._nodes[inp] = self._new_var(inp, shape=tensor.shape, dtype=get_type(tensor.dtype))
self._inputs[inp] = self._nodes[inp]

def _construct_nodes(self, graph):
"""Construct TVM relay calls from every operation of the nnef graph"""
for op in graph.operations:
if op.name == "external":
# externals are handled as input, not needed,
# but nnef treats them as operations as well
continue

if op.name == "variable":
self._set_variable(graph.tensors[op.outputs["output"]])

elif op.name == "constant":
self._set_const(op)

else:
# every other operator can be grouped more easily,
# as it does not need self for conversion
self._set_operator(op)

def _set_operator(self, node):
self._set_literal_inputs(node)
inputs = []
for ink, inv in node.inputs.items():
if isinstance(inv, list):
for i, linv in enumerate(inv):
if linv in self._nodes.keys():
inputs.append(self._nodes[linv])
else: # handle literal inputs
name = f"{node.name}_{ink}_{i}"
assert name in self._nodes, f"{name} has not been properly handled"
inputs.append(self._nodes[name])

else:
if inv in self._nodes.keys():
inputs.append(self._nodes[inv])
else: # handle literal inputs
name = f"{node.name}_{ink}"
assert name in self._nodes, f"{name} has not been properly handled"
inputs.append(self._nodes[name])

converted = self._get_relay_op_call(node.name, inputs, node.attribs)
converted = self._bb.normalize(converted)

if not isinstance(converted.struct_info, relax.TupleStructInfo):
outputs_num = 1
else:
outputs_num = len(converted.struct_info.fields)

if outputs_num == 1:
# check if the singular ret val is a list of only one element
ret_val = list(node.outputs.values())[0]
if isinstance(ret_val, list):
self._nodes[ret_val[0]] = converted
else:
self._nodes[ret_val] = converted
else:
for i, out in zip(range(outputs_num), node.outputs["values"]):
self._nodes[out] = converted[i]

def _set_const(self, node):
"""Create a tvm.relay.Constant from a nnef constant tensor"""
name = node.outputs["output"]
data = node.attribs["value"]
shape = node.attribs["shape"]
if len(data) == 1:
data = np.full(shape, data, dtype=get_type(node.dtype))
else:
data = np.array(data, dtype=get_type(node.dtype))
self._consts[name] = tvm_expr.const(data)
self._nodes[name] = self._consts[name]

def _set_variable(self, tensor):
"""Create a tvm.relay.Var (or Constant) from a nnef variable tensor"""
tens_data = tensor.data
if not self._keep_params_in_input:
self._consts[tensor.name] = tvm_expr.const(tens_data)
self._nodes[tensor.name] = self._consts[tensor.name]
else:
var = self._new_var(tensor.name, shape=tensor.shape, dtype=get_type(tensor.dtype))
self._nodes[tensor.name] = var
self._params[tensor.name] = (var, tvm.nd.array(tens_data))

def _set_literal_inputs(self, node):
"""Checks if node has literal inputs and saves them into a tvm.relay.Constant.
naming as {node.name}_{input field name}"""
for field_name, value in node.inputs.items():
if isinstance(value, list):
for v in value:
if v not in self._nodes.keys():
self._nodes[f"{node.name}_{v}"] = tvm_expr.const(v)

else:
if value not in self._nodes.keys():
self._nodes[f"{node.name}_{field_name}"] = tvm_expr.const(value)

def _get_relay_op_call(self, name, inputs, attrs):
agoston-mc marked this conversation as resolved.
Show resolved Hide resolved
"""Returns the tvm.Call equivalent to the nnef operator"""
conv_map = _get_converter_map()
if name in conv_map:

call = conv_map[name](self._bb, *inputs, **attrs)
else:
# This error is reached if NNEF is expanded with additional ops
raise NotImplementedError(
f"Operator {name} is not implemented, as {name} has been added after 1.0.5."
)
return call

def _infer_type(self, val):
if isinstance(val, bool):
return "bool", True
if isinstance(val, float):
return "float32", True
if isinstance(val, int):
return "int32", True
if isinstance(val, str):
# the string vals can be names of nodes in some of the cases
if isinstance(val, nnef.Identifier):
if val in self._nodes.keys():
node = self._nodes[val]
if isinstance(node, tvm_expr.Var):
return node.type_annotation.dtype, False
if isinstance(node, tvm_expr.Constant):
return node.data.dtype, False
if isinstance(node, tvm_expr.Call):
return node.checked_type.dtype, False
raise Exception(
f"{val} has not been loaded into the model "
"but it should have been, as a var or call."
)
return "string", True

raise TypeError(f'Value "{val}" is not a recognized type')

def _new_var(self, name, shape, dtype="float32"):
return relax.Var(
name_hint=name,
struct_info=relax.TensorStructInfo(shape=shape, dtype=dtype),
)


def from_nnef(
model: typing.Union[str, os.PathLike, nnef.Graph],
keep_params_in_input: bool = False,
) -> IRModule:
"""
Convert an NNEF model into an equivalent TVM Relay IRModule.
agoston-mc marked this conversation as resolved.
Show resolved Hide resolved


Parameters
----------
model : os.PathLike or str or nnef.Graph
Path to an NNEF model directory, containing the graph.nnef (and weight files)

keep_params_in_input : bool, optional
If this parameter is true, the nnef variables will be converted to
constants, and be embedded into the relax model, allowing optimizations
at compile time.
If False the params will have to be added as inputs,
the model can't load them automatically

Returns
-------
mod : tvm.IRModule
The relay module for compilation

params : dict of str to tvm.nd.NDArray
The parameter dictionary to be used
"""
conv_clss = NNEFConverter(keep_params_in_input)

if not isinstance(model, nnef.Graph):
model = nnef.load_graph(model)

# fills in the nnef graph's shape information
nnef.infer_shapes(model)

return conv_clss.from_nnef(graph=model)
Loading
Loading