[GNA] Added ConcatAlignFilter support for Accuracy Aware mode #7834

Merged
15 changes: 11 additions & 4 deletions inference-engine/src/gna_plugin/frontend/layer_quantizer.hpp
@@ -653,11 +653,18 @@ class DataQuantizer<Desc, InferenceEngine::WeightableLayer *> : public DataQuant

     void operator()(InferenceEngine::WeightableLayer *wl, const FakeQuant&) const {
         auto quantData = InferenceEngine::getInjectedData<QuantizedLayerParams>(*wl);
-        IE_ASSERT(quantData->_weights_quant.IsStatsSet());
-        if (quantData->_weights_quant.GetLevels() <= std::numeric_limits<uint8_t>::max()) {
-            quantizeWeightsBiases<FakeQuantI8>(FakeQuantI8(), wl, Quant<FakeQuantI8>());
+        if (quantData->_weights_quant.IsStatsSet()) {
+            if (quantData->_weights_quant.GetLevels() <= std::numeric_limits<uint8_t>::max()) {
+                quantizeWeightsBiases<FakeQuantI8>(FakeQuantI8(), wl, Quant<FakeQuantI8>());
+            } else {
+                quantizeWeightsBiases<FakeQuantI16>(FakeQuantI16(), wl, Quant<FakeQuantI16>());
+            }
         } else {
-            quantizeWeightsBiases<FakeQuantI16>(FakeQuantI16(), wl, Quant<FakeQuantI16>());
+            if (std::is_same<typename Desc::OptionalType, FakeQuant>()) {
+                THROW_GNA_EXCEPTION << "Infinite recursion: Desc::OptionalType is equal to FakeQuant.";
+            }
+
+            (*this)(wl, typename Desc::OptionalType());
         }
     }
 };
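The else branch above is the heart of the fix: when FakeQuantize statistics are missing, the functor re-dispatches to Desc::OptionalType instead of asserting, and the std::is_same check guards the degenerate case where the optional type is FakeQuant itself. A minimal standalone sketch of that tag-dispatch-with-fallback pattern (all names here are illustrative, not the plugin's API):

#include <iostream>
#include <stdexcept>
#include <type_traits>

struct QuantI16 {};                                   // fallback quantization tag
struct FakeQuant { using OptionalType = QuantI16; };  // preferred tag plus its fallback

struct Quantizer {
    // Use FakeQuantize statistics when present; otherwise retry with the fallback tag.
    void operator()(bool statsSet, const FakeQuant&) const {
        if (statsSet) {
            std::cout << "quantize using FakeQuantize statistics\n";
        } else {
            // Mirrors the THROW_GNA_EXCEPTION guard: if the fallback tag were
            // FakeQuant again, this call would recurse forever.
            if (std::is_same<FakeQuant::OptionalType, FakeQuant>::value) {
                throw std::runtime_error("OptionalType must differ from FakeQuant");
            }
            (*this)(statsSet, FakeQuant::OptionalType{});
        }
    }
    void operator()(bool, const QuantI16&) const {
        std::cout << "quantize on the default int16 path\n";
    }
};

int main() {
    Quantizer{}(false, FakeQuant{});  // no statistics: falls back to the int16 path
}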
@@ -1354,6 +1354,12 @@ class ScaleFactorCalculator
             } else {
                 return frontend::FakeQuantI16().getWeightsPrecision().size();
             }
+        } else {
+            if (!info.isSynthetic()) {
+                gnawarn() << "The layer (" << ptr->name << ") has no quantization statistics\n";
+            }
+
+            return GetOptionalWeightsBytesSize();
         }
     }

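Read together with the quantizer change, the scale-factor logic becomes: statistics present, pick int8 or int16 weights by level count; statistics absent, warn only for user-visible layers and fall back to the default weights width. A hedged sketch of that decision (function and constant names are illustrative; only GetOptionalWeightsBytesSize and isSynthetic come from the diff):

#include <cstddef>
#include <cstdint>
#include <cstdio>
#include <limits>

// Illustrative stand-ins for the plugin's FakeQuantI8/FakeQuantI16 precisions.
constexpr size_t kInt8WeightsBytes  = sizeof(int8_t);
constexpr size_t kInt16WeightsBytes = sizeof(int16_t);

size_t weightsBytesSize(bool statsSet, uint32_t levels, bool synthetic,
                        size_t optionalBytes) {
    if (statsSet) {
        // Up to 255 levels fit into int8 weights; anything larger needs int16.
        return levels <= std::numeric_limits<uint8_t>::max() ? kInt8WeightsBytes
                                                             : kInt16WeightsBytes;
    }
    if (!synthetic) {
        // Synthetic layers (e.g. ConcatAlignFilter) are inserted by the plugin
        // itself, so a missing-statistics warning would only confuse the user.
        std::fprintf(stderr, "layer has no quantization statistics\n");
    }
    return optionalBytes;  // default width for the active quantization mode
}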
4 changes: 4 additions & 0 deletions inference-engine/src/gna_plugin/layers/gna_layer_info.hpp
@@ -344,6 +344,10 @@ class LayerInfo {
         return isConcatAlignFilter() || isSyntheticScaleShift() || isCropAffined();
     }

+    bool isSynthetic() const noexcept {
+        return isConcatAlignFilter() || isSyntheticScaleShift() || isConvolutionFilter() || isAffineFilter();
+    }
+
     size_t paddingSize() const {
         static InferenceEngine::details::caseless_set<std::string> layersWithPossiblePadding = {"FullyConnected",
                                                                                                 "InnerProduct",
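isSynthetic() simply ORs together the existing predicates for layers the GNA plugin fabricates on its own (ConcatAlignFilter, synthetic ScaleShift, convolution and affine filters); the scale-factor code above keys on it to suppress the warning. A tiny standalone illustration of the same predicate-composition idea (not the plugin's LayerInfo class):

#include <iostream>

// Stand-in for LayerInfo: each flag mimics one of its is*() predicates.
struct LayerKind {
    bool concatAlignFilter = false;
    bool syntheticScaleShift = false;
    bool convolutionFilter = false;
    bool affineFilter = false;

    // "Synthetic" = inserted by the plugin rather than present in the user's model.
    bool isSynthetic() const noexcept {
        return concatAlignFilter || syntheticScaleShift || convolutionFilter || affineFilter;
    }
};

int main() {
    LayerKind filter;
    filter.concatAlignFilter = true;
    if (!filter.isSynthetic()) {
        std::cout << "warn: layer has no quantization statistics\n";  // skipped here
    }
}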
@@ -0,0 +1,111 @@
// Copyright (C) 2021 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
//

#include <tuple>
#include <vector>
#include <string>
#include <memory>

#include "shared_test_classes/base/layer_test_utils.hpp"
#include "ngraph_functions/builders.hpp"
#include "ngraph_functions/utils/ngraph_helpers.hpp"

namespace SubgraphTestsDefinitions {

typedef std::tuple<
    InferenceEngine::Precision,         // Net precision
    std::vector<size_t>,                // Input shape
    std::vector<size_t>,                // Constant shape
    LayerTestsUtils::TargetDevice,      // Device name
    std::map<std::string, std::string>  // Additional backend configuration and an alias name for it
> WeighableLayerWithoutFqParamsSet;

/*
 * This test emulates cases in which a ConcatAlignFilter layer is created while the model has FakeQuantize layers.
 */
class WeighableLayerWithoutFqTest :
        public testing::WithParamInterface<WeighableLayerWithoutFqParamsSet>,
        virtual public LayerTestsUtils::LayerTestsCommon {
public:
    static std::string getTestCaseName(const testing::TestParamInfo<WeighableLayerWithoutFqParamsSet>& obj) {
        InferenceEngine::Precision netPrecision;
        std::string targetDevice;
        std::map<std::string, std::string> config;
        std::vector<size_t> inputShape;
        std::vector<size_t> constantShape;
        // Unpack in the same order as the tuple is declared and instantiated.
        std::tie(netPrecision, inputShape, constantShape, targetDevice, config) = obj.param;

        std::ostringstream result;
        result << "netPRC=" << netPrecision.name() << "_";
        result << "trgDev=" << targetDevice;
        for (auto const& configItem : config) {
            result << "_configItem=" << configItem.first << "_" << configItem.second;
        }
        return result.str();
    }

protected:
    void SetUp() override {
        std::map<std::string, std::string> config;
        InferenceEngine::Precision netPrecision;
        std::vector<size_t> inputShape;
        std::vector<size_t> constantShape;
        // Unpack in the same order as the tuple is declared and instantiated.
        std::tie(netPrecision, inputShape, constantShape, targetDevice, config) = this->GetParam();
        configuration.insert(config.begin(), config.end());

        auto ngPrc = FuncTestUtils::PrecisionUtils::convertIE2nGraphPrc(netPrecision);
        auto params = ngraph::builder::makeParams(ngPrc, {inputShape});
        auto fq1 = std::make_shared<ngraph::opset8::FakeQuantize>(
            params[0],
            ngraph::opset8::Constant::create(ngraph::element::f32, {1}, {1.}),
            ngraph::opset8::Constant::create(ngraph::element::f32, {1}, {1.}),
            ngraph::opset8::Constant::create(ngraph::element::f32, {1}, {1.}),
            ngraph::opset8::Constant::create(ngraph::element::f32, {1}, {1.}),
            255);
        auto constant = ngraph::builder::makeConstant(ngPrc, constantShape, std::vector<float>{}, true);
        auto fq2 = std::make_shared<ngraph::opset8::FakeQuantize>(
            constant,
            ngraph::opset8::Constant::create(ngraph::element::f32, {1}, {1.}),
            ngraph::opset8::Constant::create(ngraph::element::f32, {1}, {1.}),
            ngraph::opset8::Constant::create(ngraph::element::f32, {1}, {1.}),
            ngraph::opset8::Constant::create(ngraph::element::f32, {1}, {1.}),
            255);
        auto concat = ngraph::builder::makeConcat({fq1, fq2}, 0);
        function = std::make_shared<ngraph::Function>(concat, params, "WeighableLayerWithoutFq");
    }
};  // class WeighableLayerWithoutFqTest

TEST_P(WeighableLayerWithoutFqTest, CompareWithRefs) {
    Run();
}

namespace {
const std::vector<InferenceEngine::Precision> netPrecisions = {
    InferenceEngine::Precision::FP32,
    InferenceEngine::Precision::FP16,
};

const std::vector<std::vector<size_t>> inputShapes = {
    {{1, 5}}
};

const std::vector<std::vector<size_t>> constantShapes = {
    {{16, 5}}
};

const std::vector<std::map<std::string, std::string>> configs = {
    {{"GNA_DEVICE_MODE", "GNA_SW_FP32"}},
    {{"GNA_DEVICE_MODE", "GNA_SW_EXACT"}}
};

INSTANTIATE_TEST_SUITE_P(smoke_WeighableLayerWithoutFqTest, WeighableLayerWithoutFqTest,
    ::testing::Combine(
        ::testing::ValuesIn(netPrecisions),
        ::testing::ValuesIn(inputShapes),
        ::testing::ValuesIn(constantShapes),
        ::testing::Values(CommonTestUtils::DEVICE_GNA),
        ::testing::ValuesIn(configs)),
    WeighableLayerWithoutFqTest::getTestCaseName);
}  // namespace
} // namespace SubgraphTestsDefinitions
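Assuming the standard OpenVINO functional-test binary for the GNA plugin (the target name gnaFuncTests is an assumption here, not stated in the diff), the new suite can be run in isolation with a gtest filter:

./gnaFuncTests --gtest_filter='smoke_WeighableLayerWithoutFqTest*'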