Support PyTorch FX diagnosis in Neural Insights (#1190)

Signed-off-by: bmyrcha <[email protected]> Co-authored-by: Cheng, Penghui <[email protected]> Co-authored-by: Agata Radys <[email protected]>
intel · Sep 12, 2023 · 74a785e · 74a785e
1 parent 8d2bf27
commit 74a785e
Show file tree

Hide file tree

Showing 52 changed files with 883 additions and 262 deletions.
diff --git a/.azure-pipelines/scripts/codeScan/pylint/pylint.sh b/.azure-pipelines/scripts/codeScan/pylint/pylint.sh
@@ -52,7 +52,7 @@ elif [ "${scan_module}" = "neural_insights" ]; then
 fi
 
 python -m pylint -f json --disable=R,C,W,E1129 --enable=line-too-long --max-line-length=120 --extension-pkg-whitelist=numpy --ignored-classes=TensorProto,NodeProto \
---ignored-modules=tensorflow,torch,torch.quantization,torch.tensor,torchvision,fairseq,mxnet,onnx,onnxruntime,intel_extension_for_pytorch,intel_extension_for_tensorflow /neural-compressor/${scan_module} \
+--ignored-modules=tensorflow,torch,torch.quantization,torch.tensor,torchvision,fairseq,mxnet,onnx,onnxruntime,intel_extension_for_pytorch,intel_extension_for_tensorflow,torchinfo /neural-compressor/${scan_module} \
 >$log_dir/pylint.json
 
 exit_code=$?

diff --git a/neural_compressor/adaptor/pytorch.py b/neural_compressor/adaptor/pytorch.py
@@ -968,8 +968,10 @@ def eval_func(self, model, dataloader, postprocess, metrics, measurer, iteration
             for idx, input in enumerate(dataloader):
                 if isinstance(input, dict) or isinstance(input, UserDict):
                     if not self.benchmark:
-                        assert "label" in input, "The dataloader must include label to measure the metric!"
-                        label = input["label"].to("cpu")
+                        assert (
+                            "label" in input or "labels" in input
+                        ), "The dataloader must include label to measure the metric!"
+                        label = input["label"].to("cpu") if "label" in input else input["labels"].to("cpu")
                 elif not self.benchmark:
                     assert False, "The dataloader must include label to measure the metric!"
 

diff --git a/neural_compressor/benchmark.py b/neural_compressor/benchmark.py
@@ -518,19 +518,23 @@ def fit(model, conf, b_dataloader=None, b_func=None):
         set_env_var("NC_ENV_CONF", True, overwrite_existing=True)
 
     if conf.diagnosis and os.environ.get("NC_ENV_CONF", None) in [None, "False"]:
-        logger.info("Start to run Profiling")
-        ni_workload_id = register_neural_insights_workload(
-            workload_location=os.path.abspath(os.path.abspath(options.workspace)),
-            model=wrapped_model,
-            workload_mode="benchmark",
-        )
-        try:
-            update_neural_insights_workload(ni_workload_id, "wip")
-            profile(wrapped_model, conf, b_dataloader)
-            update_neural_insights_workload(ni_workload_id, "success")
-        except Exception as e:
-            logger.error(e)
-            update_neural_insights_workload(ni_workload_id, "failure")
+        if b_dataloader is not None:
+            logger.info("Start to run Profiling")
+            ni_workload_id = register_neural_insights_workload(
+                workload_location=os.path.abspath(os.path.abspath(options.workspace)),
+                model=wrapped_model,
+                workload_mode="benchmark",
+                workload_name=conf.ni_workload_name,
+            )
+            try:
+                update_neural_insights_workload(ni_workload_id, "wip")
+                profile(wrapped_model, conf, b_dataloader=b_dataloader)
+                update_neural_insights_workload(ni_workload_id, "success")
+            except Exception as e:
+                logger.error(e)
+                update_neural_insights_workload(ni_workload_id, "failure")
+        else:
+            logger.warning("Profiling is only supported with b_dataloader.")
 
     logger.info("Start to run Benchmark.")
     if os.environ.get("NC_ENV_CONF") == "True":

diff --git a/neural_compressor/config.py b/neural_compressor/config.py
@@ -302,6 +302,7 @@ def __init__(
         inter_num_of_threads=None,
         intra_num_of_threads=None,
         diagnosis=False,
+        ni_workload_name="profiling",
     ):
         """Init a BenchmarkConfig object."""
         self.inputs = inputs
@@ -316,6 +317,7 @@ def __init__(
         self.inter_num_of_threads = inter_num_of_threads
         self.intra_num_of_threads = intra_num_of_threads
         self.diagnosis = diagnosis
+        self.ni_workload_name = ni_workload_name
         self._framework = None
 
     def keys(self):
@@ -464,6 +466,17 @@ def diagnosis(self, diagnosis):
         if _check_value("diagnosis", diagnosis, bool):
             self._diagnosis = diagnosis
 
+    @property
+    def ni_workload_name(self):
+        """Get Neural Insights workload name."""
+        return self._ni_workload_name
+
+    @ni_workload_name.setter
+    def ni_workload_name(self, ni_workload_name):
+        """Set Neural Insights workload name."""
+        if _check_value("ni_workload_name", ni_workload_name, str):
+            self._ni_workload_name = ni_workload_name
+
     @property
     def model_name(self):
         """Get model name."""
@@ -801,6 +814,7 @@ def __init__(
         accuracy_criterion=accuracy_criterion,
         tuning_criterion=tuning_criterion,
         diagnosis=False,
+        ni_workload_name="quantization",
     ):
         """Initialize _BaseQuantizationConfig class."""
         self.inputs = inputs
@@ -822,6 +836,7 @@ def __init__(
         self.quant_level = quant_level
         self._framework = None
         self.diagnosis = diagnosis
+        self.ni_workload_name = ni_workload_name
         self._example_inputs = example_inputs
 
     @property
@@ -1259,6 +1274,8 @@ class PostTrainingQuantConfig(_BaseQuantizationConfig):
                             Please refer to docstring of AccuracyCriterion class.
         diagnosis(bool): This flag indicates whether to do diagnosis.
                            Default value is False.
+        ni_workload_name: Custom workload name for Neural Insights diagnosis workload.
+                           Default value is 'quantization'.
 
     Example::
 
@@ -1293,6 +1310,7 @@ def __init__(
         accuracy_criterion=accuracy_criterion,
         tuning_criterion=tuning_criterion,
         diagnosis=False,
+        ni_workload_name="quantization",
     ):
         """Init a PostTrainingQuantConfig object."""
         super().__init__(
@@ -1313,9 +1331,13 @@ def __init__(
             accuracy_criterion=accuracy_criterion,
             tuning_criterion=tuning_criterion,
             diagnosis=diagnosis,
+            ni_workload_name=ni_workload_name,
         )
         self.approach = approach
         self.diagnosis = diagnosis
+        self.ni_workload_name = ni_workload_name
+        if self.diagnosis:
+            self.tuning_criterion.max_trials = 1
 
     @property
     def approach(self):
@@ -1343,6 +1365,17 @@ def diagnosis(self, diagnosis):
         if _check_value("diagnosis", diagnosis, bool):
             self._diagnosis = diagnosis
 
+    @property
+    def ni_workload_name(self):
+        """Get Neural Insights workload name."""
+        return self._ni_workload_name
+
+    @ni_workload_name.setter
+    def ni_workload_name(self, ni_workload_name):
+        """Set Neural Insights workload name."""
+        if _check_value("ni_workload_name", ni_workload_name, str):
+            self._ni_workload_name = ni_workload_name
+
 
 class QuantizationAwareTrainingConfig(_BaseQuantizationConfig):
     """Config Class for Quantization Aware Training.

diff --git a/neural_compressor/model/torch_model.py b/neural_compressor/model/torch_model.py
@@ -48,6 +48,7 @@ def __init__(self, model, **kwargs):
         torch.nn.Module.__init__(self)
         self._model = model
         assert isinstance(model, torch.nn.Module), "model should be pytorch nn.Module."
+        self._model_path = None if not isinstance(model, str) else model
         self.handles = []
         self.tune_cfg = None
         self.q_config = None
@@ -99,6 +100,16 @@ def model(self, model):
         """Setter to model."""
         self._model = model
 
+    @property
+    def model_path(self):
+        """Return model path."""
+        return self._model_path
+
+    @model_path.setter
+    def model_path(self, path):
+        """Set model path."""
+        self._model_path = path
+
     @property
     def fp32_model(self):
         """Getter to model."""

diff --git a/neural_compressor/quantization.py b/neural_compressor/quantization.py
@@ -216,6 +216,7 @@ def eval_func(model):
                     workload_location=os.path.abspath(options.workspace),
                     model=wrapped_model,
                     workload_mode="quantization",
+                    workload_name=conf.ni_workload_name,
                 )
                 if ni_workload_id:
                     update_neural_insights_workload(ni_workload_id, "wip")

diff --git a/neural_compressor/utils/neural_insights_utils.py b/neural_compressor/utils/neural_insights_utils.py
@@ -14,23 +14,25 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """Neural Insights utils functions."""
+import os
 from typing import Any, Optional
 
-from neural_compressor.model.onnx_model import ONNXModel
 from neural_compressor.utils import logger
 
 
 def register_neural_insights_workload(
     workload_location: str,
     model: Any,
     workload_mode: str,
+    workload_name: str,
 ) -> Optional[str]:
     """Register workload to Neural Insights.
 
     Args:
         workload_location: path to workload directory
         model: Neural Compressor's model instance to be registered
         workload_mode: workload mode
+        workload_name: Name of the workload
 
     Returns:
         String with Neural Insight workload UUID if registered else None
@@ -46,22 +48,15 @@ def register_neural_insights_workload(
         except ValueError:
             raise Exception(f"Workload mode '{workload_mode}' is not supported.")
 
-        model_path = None
-        if isinstance(model.model_path, str):
-            model_path: str = os.path.abspath(model.model_path)
-        elif isinstance(model, ONNXModel):
-            import onnx
-
-            model_path: str = os.path.join(workload_location, "input_model.onnx")
-            os.makedirs(workload_location, exist_ok=True)
-            onnx.save(model.model, model_path)
-        assert isinstance(model_path, str), "Model path not detected"
+        model_path, model_summary_file = get_model_path(model, workload_location)
 
         neural_insights = NeuralInsights(workdir_location=WORKDIR_LOCATION)
         ni_workload_uuid = neural_insights.add_workload(
             workload_location=workload_location,
             workload_mode=mode,
             model_path=model_path,
+            workload_name=workload_name,
+            model_summary_file=model_summary_file,
         )
         logger.info(f"Registered {workload_mode} workload to Neural Insights.")
         return ni_workload_uuid
@@ -123,3 +118,57 @@ def update_neural_insights_workload_accuracy_data(
         logger.info("Neural Insights not found.")
     except Exception as err:
         logger.warning(f"Could not update workload accuracy data: {err}.")
+
+
+def get_model_path(model: Any, workload_location: str) -> Any:
+    """Get model path."""
+    from neural_insights.utils.exceptions import ClientErrorException
+    from neural_insights.utils.utils import check_module
+
+    model_path = None
+    model_summary_file = None
+    onnx_installed = False
+    pytorch_installed = False
+
+    try:
+        check_module("onnx")
+        onnx_installed = True
+    except ClientErrorException:
+        pass
+
+    try:
+        check_module("torch")
+        pytorch_installed = True
+    except ClientErrorException:
+        pass
+
+    if isinstance(model.model_path, str):
+        return os.path.abspath(model.model_path)
+    if onnx_installed:
+        import onnx
+
+        from neural_compressor.model.onnx_model import ONNXModel
+
+        if isinstance(model, ONNXModel):
+            model_path: str = os.path.join(workload_location, "input_model.onnx")
+            os.makedirs(workload_location, exist_ok=True)
+            onnx.save(model.model, model_path)
+            return model_path, model_summary_file
+    if pytorch_installed:
+        import torch
+        from torchinfo import summary
+
+        from neural_compressor.model.torch_model import PyTorchModel
+
+        if isinstance(model, PyTorchModel):
+            model_path: str = os.path.join(workload_location, "input_model.pt")
+            os.makedirs(workload_location, exist_ok=True)
+            torch.save(model.model.state_dict(), model_path)
+
+            model_stats = summary(model.model, depth=5, verbose=0)
+            summary_str = str(model_stats)
+            model_summary_file = os.path.join(workload_location, "model_summary.txt")
+            with open(model_summary_file, "w", encoding="utf-8") as summary_file:
+                summary_file.write(summary_str)
+            return model_path, model_summary_file
+    assert isinstance(model_path, str), "Model path not detected"
diff --git a/neural_compressor/utils/utility.py b/neural_compressor/utils/utility.py
@@ -961,6 +961,9 @@ def print_op_list(workload_location: str):
         None
     """
     minmax_file_path = os.path.join(workload_location, "inspect_saved", "activation_min_max.pkl")
+    if not os.path.exists(minmax_file_path):
+        logging.getLogger("neural_compressor").warning("Could not find activation min max data.")
+        return
     input_model_tensors = get_tensors_info(
         workload_location,
         model_type="input",

diff --git a/neural_insights/components/diagnosis/diagnosis.py b/neural_insights/components/diagnosis/diagnosis.py
@@ -24,6 +24,7 @@
 from neural_insights.components.model.model import Model
 from neural_insights.components.workload_manager.workload import Workload
 from neural_insights.utils.exceptions import ClientErrorException, InternalException
+from neural_insights.utils.logger import log
 from neural_insights.utils.utils import check_module
 
 
@@ -69,7 +70,17 @@ def load_quantization_config(self) -> dict:
             "cfg.pkl",
         )
         if not os.path.exists(config_path):
-            raise ClientErrorException("Could not find config data for specified optimization.")
+            log.debug("Could not find config data for specified optimization. Getting data from inspect files.")
+            input_model_tensors: dict = self.get_tensors_info(model_type="input")["activation"][0]
+            optimized_model_tensors: dict = self.get_tensors_info(model_type="optimized")["activation"][0]
+            common_ops = list(set(input_model_tensors.keys()) & set(optimized_model_tensors.keys()))
+            config_data = {
+                "op": {},
+            }
+            for op in common_ops:
+                config_data["op"].update({(op,): {}})
+            return config_data
+
         with open(config_path, "rb") as config_pickle:
             config_data = pickle.load(config_pickle)
         return config_data
@@ -79,23 +90,37 @@ def get_op_list(self) -> List[dict]:
         check_module("numpy")
         import numpy as np
 
+        op_list: List[dict] = []
+
+        input_model_tensors: dict = self.get_tensors_info(model_type="input")["activation"][0]
+        optimized_model_tensors: dict = self.get_tensors_info(model_type="optimized")["activation"][0]
+
         minmax_file_path = os.path.join(
             self.workload_location,
             "inspect_saved",
             "activation_min_max.pkl",
         )
-        with open(minmax_file_path, "rb") as min_max_file:
-            min_max_data: dict = pickle.load(min_max_file)
 
-        op_list: List[dict] = []
-        input_model_tensors: dict = self.get_tensors_info(model_type="input")["activation"][0]
-        optimized_model_tensors: dict = self.get_tensors_info(model_type="optimized")["activation"][0]
+        try:
+            with open(minmax_file_path, "rb") as min_max_file:
+                min_max_data: dict = pickle.load(min_max_file)
+        except FileNotFoundError:
+            log.debug("Could not find minmax file.")
+            common_ops = list(set(input_model_tensors.keys()) & set(optimized_model_tensors.keys()))
+            min_max_data = dict(zip(common_ops, [{"min": None, "max": None}] * len(common_ops)))
+
         for op_name, min_max in min_max_data.items():
             mse = self.calculate_mse(op_name, input_model_tensors, optimized_model_tensors)
             if mse is None or np.isnan(mse):
                 continue
-            min = float(min_max.get("min", None))
-            max = float(min_max.get("max", None))
+            min = min_max.get("min", None)
+            max = min_max.get("max", None)
+
+            if min is not None:
+                min = float(min)
+            if max is not None:
+                max = float(max)
+
             op_entry = OpEntry(op_name, mse, min, max)
             op_list.append(op_entry.serialize())
         return op_list

diff --git a/neural_insights/components/diagnosis/factory.py b/neural_insights/components/diagnosis/factory.py
@@ -15,6 +15,7 @@
 """Diagnosis class factory."""
 from neural_insights.components.diagnosis.diagnosis import Diagnosis
 from neural_insights.components.diagnosis.onnx_diagnosis.onnxrt_diagnosis import OnnxRtDiagnosis
+from neural_insights.components.diagnosis.pytorch_diagnosis.pytorch_diagnosis import PyTorchDiagnosis
 from neural_insights.components.diagnosis.tensorflow_diagnosis.tensorflow_diagnosis import TensorflowDiagnosis
 from neural_insights.components.workload_manager.workload import Workload
 from neural_insights.utils.consts import Frameworks
@@ -33,6 +34,7 @@ def get_diagnosis(
         diagnosis_map = {
             Frameworks.ONNX: OnnxRtDiagnosis,
             Frameworks.TF: TensorflowDiagnosis,
+            Frameworks.PT: PyTorchDiagnosis,
         }
         diagnosis = diagnosis_map.get(workload.framework, None)
         if diagnosis is None: