
Commit

Allow using a dictionary for ONNX export (#944)
Signed-off-by: Ella Charlaix <[email protected]>
echarlaix authored Jun 7, 2023
1 parent ee59a32 commit 17b6425
Showing 1 changed file with 11 additions and 12 deletions.
23 changes: 11 additions & 12 deletions neural_compressor/experimental/export/torch2onnx.py
@@ -30,16 +30,14 @@
 ort = LazyImport('onnxruntime')
 ortq = LazyImport('onnxruntime.quantization')
 
-def _prepare_intputs(pt_model, input_names, example_inputs):
+def _prepare_inputs(pt_model, input_names, example_inputs):
     """Prepare input_names and example_inputs."""
-    if input_names is None and \
-        (isinstance(example_inputs, dict) or isinstance(example_inputs, UserDict)): # pragma: no cover
-        input_names = list(example_inputs.keys())
-        example_inputs = list(example_inputs.values())
-    elif isinstance(example_inputs, dict) or isinstance(example_inputs, UserDict):
-        example_inputs = list(example_inputs.values())
+    if isinstance(example_inputs, dict) or isinstance(example_inputs, UserDict):
+        input_names = input_names or list(example_inputs.keys())
+        if isinstance(example_inputs, UserDict):
+            example_inputs = dict(example_inputs)
     # match input_names with inspected input_order, especially for BERT in huggingface.
-    if input_names and len(input_names) > 1:
+    elif input_names and len(input_names) > 1:
         import inspect
         input_order = inspect.signature(pt_model.forward).parameters.keys()
         flag = [name in input_order for name in input_names] # whether should be checked
@@ -53,6 +51,7 @@ def _prepare_intputs(pt_model, input_names, example_inputs):
                     new_example_inputs.append(example_inputs[id])
             input_names = new_input_names
             example_inputs = new_example_inputs
+    example_inputs = input2tuple(example_inputs)
     return input_names, example_inputs
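
The net effect of the rework: a dict (or a transformers-style UserDict) passed as example_inputs is no longer flattened into a list of values. Its keys now supply any missing input_names, a UserDict is converted to a plain dict, and the final input2tuple call normalizes whatever remains. A minimal sketch of the new behavior, using a hypothetical TinyModel and dummy tensors (illustrative only; the helper itself is private and not part of the public API):

    import torch
    from collections import UserDict
    from neural_compressor.experimental.export.torch2onnx import _prepare_inputs

    class TinyModel(torch.nn.Module):
        def forward(self, input_ids, attention_mask):
            return input_ids + attention_mask

    inputs = UserDict({"input_ids": torch.ones(1, 8, dtype=torch.long),
                       "attention_mask": torch.ones(1, 8, dtype=torch.long)})
    # With input_names=None, the names are now derived from the dict keys.
    names, prepared = _prepare_inputs(TinyModel(), None, inputs)
    print(names)  # ['input_ids', 'attention_mask']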


@@ -86,12 +85,12 @@ def torch_to_fp32_onnx(
     assert is_int8_model(pt_model) == False, "The fp32 model is replaced during quantization. " + \
         "please customize an eval_func when quantizing, if not, such as `lambda x: 1`."
 
-    input_names, example_inputs = _prepare_intputs(pt_model, input_names, example_inputs)
+    input_names, example_inputs = _prepare_inputs(pt_model, input_names, example_inputs)
 
     with torch.no_grad():
         torch.onnx.export(
             pt_model,
-            input2tuple(example_inputs),
+            example_inputs,
             save_path,
             opset_version=opset_version,
             input_names=input_names,
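
Because the tuple conversion now happens inside _prepare_inputs, torch.onnx.export receives example_inputs already normalized, so the public entry point can be handed a dict directly. A hedged usage sketch, reusing TinyModel from the sketch above and assuming the positional order (pt_model, save_path, example_inputs); the exact signature may differ by version:

    import torch
    from neural_compressor.experimental.export.torch2onnx import torch_to_fp32_onnx

    # Input names default to the dict keys when input_names is not given.
    torch_to_fp32_onnx(
        TinyModel(),
        "tiny_fp32.onnx",
        {"input_ids": torch.ones(1, 8, dtype=torch.long),
         "attention_mask": torch.ones(1, 8, dtype=torch.long)},
    )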
@@ -148,7 +147,7 @@ def torch_to_int8_onnx(
         "1. export FP32 PyTorch model to FP32 ONNX model. " \
         "2. use FP32 ONNX model as the input model for post training dynamic quantization."
 
-    input_names, example_inputs = _prepare_intputs(pt_model, input_names, example_inputs)
+    input_names, example_inputs = _prepare_inputs(pt_model, input_names, example_inputs)
 
     def model_wrapper(model_fn):
         # export doesn't support a dictionary output, so manually turn it into a tuple
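
For context, model_wrapper exists because torch.onnx.export cannot trace a dictionary output (common for huggingface models), so the forward function is wrapped to unpack the dict into a tuple. A rough reconstruction of that wrapping idea, not the library's exact code:

    def model_wrapper(model_fn):
        def wrapper(*args, **kwargs):
            output = model_fn(*args, **kwargs)
            if isinstance(output, dict):
                # Drop None entries and return the values as a plain tuple.
                return tuple(v for v in output.values() if v is not None)
            return output
        return wrapper

    # Applied as: pt_model.forward = model_wrapper(pt_model.forward)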
@@ -193,4 +192,4 @@ def wrapper(*args, **kwargs):
     info = "The INT8 ONNX Model exported to path: {0}".format(save_path)
     logger.info("*"*len(info))
     logger.info(info)
-    logger.info("*"*len(info))
+    logger.info("*"*len(info))
