forked from openvinotoolkit/openvino
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
[CPU] Adaptive pooling implementation (openvinotoolkit#6594)
- Loading branch information
1 parent
5a0e2fa
commit d5d101e
Showing
17 changed files
with
870 additions
and
32 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
264 changes: 264 additions & 0 deletions
264
inference-engine/src/mkldnn_plugin/nodes/mkldnn_adaptive_pooling.cpp
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,264 @@ | ||
// Copyright (C) 2021 Intel Corporation | ||
// SPDX-License-Identifier: Apache-2.0 | ||
// | ||
|
||
#include "mkldnn_adaptive_pooling.h" | ||
#include "ie_parallel.hpp" | ||
#include <cpu/x64/cpu_isa_traits.hpp> | ||
#include <math.h> | ||
#include <mkldnn.hpp> | ||
#include <mkldnn_extension_utils.h> | ||
#include <mkldnn_selective_build.h> | ||
#include <mkldnn_types.h> | ||
#include <ngraph/opsets/opset8.hpp> | ||
#include <string> | ||
#include <utils/bfloat16.hpp> | ||
#include <utils/general_utils.h> | ||
#include <vector> | ||
|
||
using namespace MKLDNNPlugin; | ||
using namespace InferenceEngine; | ||
using namespace mkldnn; | ||
using namespace mkldnn::impl::cpu::x64; | ||
|
||
bool MKLDNNAdaptivePoolingNode::isSupportedOperation(const std::shared_ptr<ngraph::Node>& op, std::string& errorMessage) noexcept { | ||
try { | ||
if (one_of(op->get_type_info(), ngraph::op::v8::AdaptiveAvgPool::type_info)) { | ||
auto adaPool = std::dynamic_pointer_cast<ngraph::opset8::AdaptiveAvgPool>(op); | ||
if (!adaPool) { | ||
errorMessage = "Only opset8 AdaptiveAvgPooling operation is supported"; | ||
return false; | ||
} | ||
} else if (one_of(op->get_type_info(), ngraph::op::v8::AdaptiveMaxPool::type_info)) { | ||
auto adaPool = std::dynamic_pointer_cast<ngraph::opset8::AdaptiveMaxPool>(op); | ||
if (!adaPool) { | ||
errorMessage = "Only opset8 AdaptiveMaxPooling operation is supported"; | ||
return false; | ||
} | ||
} else { | ||
errorMessage = "Unsupported Adaptive pooling mode"; | ||
return false; | ||
} | ||
} catch (...) { | ||
return false; | ||
} | ||
return true; | ||
} | ||
|
||
MKLDNNAdaptivePoolingNode::MKLDNNAdaptivePoolingNode(const std::shared_ptr<ngraph::Node>& op, const mkldnn::engine& eng, | ||
MKLDNNWeightsSharing::Ptr &cache) : MKLDNNNode(op, eng, cache) { | ||
std::string errorMessage; | ||
if (isSupportedOperation(op, errorMessage)) { | ||
errorPrefix = "Adaptive Pooling layer with name '" + getName() + "' "; | ||
} else { | ||
IE_THROW(NotImplemented) << errorMessage; | ||
} | ||
if (one_of(op->get_type_info(), ngraph::op::v8::AdaptiveAvgPool::type_info)) { | ||
algorithm = Algorithm::AdaptivePoolingAvg; | ||
} else if (one_of(op->get_type_info(), ngraph::op::v8::AdaptiveMaxPool::type_info)) { | ||
algorithm = Algorithm::AdaptivePoolingMax; | ||
} | ||
} | ||
|
||
void MKLDNNAdaptivePoolingNode::getSupportedDescriptors() { | ||
if (!descs.empty()) | ||
return; | ||
|
||
if (getParentEdges().size() != 2) | ||
IE_THROW() << errorPrefix << "has incorrect number of input edges: " << getParentEdges().size(); | ||
if (getChildEdges().size() != (algorithm == AdaptivePoolingMax ? 2 : 1)) | ||
IE_THROW() << errorPrefix << "has incorrect number of output edges: " << getParentEdges().size(); | ||
|
||
auto parentDims = getParentEdgeAt(0)->getDims(); | ||
auto childDims = getChildEdgeAt(0)->getDims(); | ||
|
||
spatialDimsCount = parentDims.ndims() - 2; | ||
if (!one_of(spatialDimsCount, 1, 2, 3)) { | ||
IE_THROW() << errorPrefix << "doesn't support 0th input with rank: " << getParentEdgeAt(0)->getDims().ndims(); | ||
} | ||
|
||
if (getParentEdgeAt(1)->getDims().ndims() != 1) { | ||
IE_THROW() << errorPrefix << "doesn't support 1st input with rank: " << getParentEdgeAt(1)->getDims().ndims(); | ||
} | ||
|
||
if (getChildEdgeAt(0)->getDims().ndims() != getParentEdgeAt(0)->getDims().ndims()) { | ||
IE_THROW() << errorPrefix << "must keep data rank"; | ||
} | ||
} | ||
|
||
void MKLDNNAdaptivePoolingNode::initSupportedPrimitiveDescriptors() { | ||
if (!supportedPrimitiveDescriptors.empty()) | ||
return; | ||
|
||
// we supports only fp32 currently | ||
precision = Precision::FP32; | ||
|
||
InferenceEngine::LayerConfig config; | ||
config.dynBatchSupport = false; | ||
config.inConfs.resize(2); | ||
config.outConfs.resize((algorithm == Algorithm::AdaptivePoolingAvg ? 1 : 2)); | ||
|
||
std::vector<TensorDescCreatorTypes> dataFormats{ TensorDescCreatorTypes::ncsp }; | ||
if (getParentEdgeAt(0)->getDims()[1] != 1) { | ||
dataFormats.push_back(TensorDescCreatorTypes::nspc); | ||
dataFormats.push_back(TensorDescCreatorTypes::nCsp16c); | ||
dataFormats.push_back(TensorDescCreatorTypes::nCsp8c); | ||
} | ||
for (const auto &df : dataFormats) { | ||
if (algorithm == Algorithm::AdaptivePoolingAvg) { | ||
addSupportedPrimDesc({{df, precision}, {TensorDescCreatorTypes::ncsp, Precision::I32}}, | ||
{{df, precision}}, | ||
impl_desc_type::unknown); | ||
} else { | ||
addSupportedPrimDesc({{df, precision}, {TensorDescCreatorTypes::ncsp, Precision::I32}}, | ||
{{df, precision}, {TensorDescCreatorTypes::ncsp, Precision::I32}}, | ||
impl_desc_type::unknown); | ||
} | ||
} | ||
} | ||
|
||
void MKLDNNAdaptivePoolingNode::execute(mkldnn::stream strm) { | ||
auto inputPrec = getParentEdgeAt(0)->getMemory().GetDescriptor().data.data_type; | ||
auto outputPrec = getChildEdgeAt(0)->getMemory().GetDescriptor().data.data_type; | ||
if (!(inputPrec == mkldnn_f32 && outputPrec == mkldnn_f32)) | ||
IE_THROW() << errorPrefix << "doesn't support demanded precisions"; | ||
|
||
auto &srcMemory0 = getParentEdgeAt(0)->getMemory(); | ||
auto &srcMemory1 = getParentEdgeAt(1)->getMemory(); | ||
int *indexDst = nullptr; | ||
|
||
if (algorithm == Algorithm::AdaptivePoolingMax) { | ||
indexDst = reinterpret_cast<int *>(getChildEdgeAt(1)->getMemoryPtr()->GetPtr()); | ||
} | ||
|
||
auto srcBlockDesc = srcMemory0.GetDescriptor().data.format_desc.blocking; | ||
|
||
int blockSize = srcBlockDesc.inner_nblks > 0 ? srcBlockDesc.inner_blks[0] : 1; | ||
auto isPlainFmt = srcMemory0.GetDesc().isPlainFormat(); | ||
auto isTailCFmt = srcMemory0.GetDesc().isTailCFormat(); | ||
|
||
const auto *src = reinterpret_cast<const float *>(getParentEdgeAt(0)->getMemoryPtr()->GetPtr()); | ||
const auto *srcPooledSpatialShapes = reinterpret_cast<const int *>(getParentEdgeAt(1)->getMemoryPtr()->GetPtr()); | ||
auto *dst = reinterpret_cast<float *>(getChildEdgeAt(0)->getMemoryPtr()->GetPtr()); | ||
|
||
if (srcMemory1.GetElementsCount() != spatialDimsCount) | ||
IE_THROW() << errorPrefix << "has input spatial dimension (" << srcMemory1.GetElementsCount() | ||
<< ") inconsistent with pooling vector size (" << spatialDimsCount << ")"; | ||
|
||
auto inputDimVector = srcMemory0.GetDims(); | ||
const int N = static_cast<int>(inputDimVector[0]); | ||
const int C = static_cast<int>(inputDimVector[1]); | ||
const int ID = static_cast<int>(spatialDimsCount == 3 ? inputDimVector[2] : 1); | ||
const int IH = static_cast<int>(spatialDimsCount >= 2 ? inputDimVector[spatialDimsCount] : 1); | ||
const int IW = static_cast<int>(inputDimVector[spatialDimsCount + 1]); | ||
|
||
const int OD = static_cast<int>(spatialDimsCount == 3 ? srcPooledSpatialShapes[0] : 1); | ||
const int OH = static_cast<int>(spatialDimsCount >= 2 ? srcPooledSpatialShapes[spatialDimsCount - 2] : 1); | ||
const int OW = static_cast<int>(srcPooledSpatialShapes[spatialDimsCount - 1]); | ||
|
||
const int iHW = IH * IW; | ||
const int oDHW = OD * OH * OW, oHW = OH * OW; | ||
|
||
const int chPadding = srcMemory0.GetDescriptor().data.padded_dims[1]; | ||
const int blockCount = (isTailCFmt ? 1 : chPadding / blockSize); | ||
auto selectedPrimitiveDescriptor = getSelectedPrimitiveDescriptor(); | ||
if (!selectedPrimitiveDescriptor) | ||
IE_THROW() << errorPrefix << "doesn't have primitive descriptors."; | ||
auto config = selectedPrimitiveDescriptor->getConfig(); | ||
auto srcStrides = config.inConfs[0].desc.getBlockingDesc().getStrides(); | ||
auto dstStrides = config.outConfs[0].desc.getBlockingDesc().getStrides(); | ||
|
||
// unified strides array | ||
const size_t tailDimsOffset = (isTailCFmt ? -1 : 0); | ||
const size_t inStrides[5] = { | ||
srcStrides[0], | ||
(isTailCFmt ? 1 : srcStrides[1]), | ||
(spatialDimsCount == 3 ? srcStrides[2 + tailDimsOffset] : 0), | ||
(spatialDimsCount >= 2 ? srcStrides[spatialDimsCount + tailDimsOffset] : 0), | ||
srcStrides[spatialDimsCount + 1 + tailDimsOffset] }; | ||
const size_t outStrides[5] = { | ||
dstStrides[0], | ||
(isTailCFmt ? 1 : dstStrides[1]), | ||
(spatialDimsCount == 3 ? dstStrides[2 + tailDimsOffset] : 0), | ||
(spatialDimsCount >= 2 ? dstStrides[spatialDimsCount + tailDimsOffset] : 0), | ||
dstStrides[spatialDimsCount + 1 + tailDimsOffset] }; | ||
|
||
std::function<void(const float *, float *, int, int, int, size_t)> pool; | ||
auto poolMax = [&] (const float *srcData, float *dstData, int od, int oh, int ow, size_t spatIndOff) { | ||
size_t dStart, dEnd, hStart, hEnd, wStart, wEnd; | ||
setBinBorders(&dStart, &dEnd, od, ID, OD); | ||
setBinBorders(&hStart, &hEnd, oh, IH, OH); | ||
setBinBorders(&wStart, &wEnd, ow, IW, OW); | ||
float res = srcData[dStart * inStrides[2] + hStart * inStrides[3] + wStart * inStrides[4]]; // initial max value | ||
int resIndex = dStart * iHW + hStart * IW + wStart; // initial max index | ||
for (size_t pixD = dStart; pixD < dEnd; pixD++) { | ||
for (size_t pixH = hStart; pixH < hEnd; pixH++) { | ||
for (size_t pixW = wStart; pixW < wEnd; pixW++) { | ||
float curr = srcData[pixD * inStrides[2] + pixH * inStrides[3] + pixW * inStrides[4]]; | ||
resIndex = (res < curr ? pixD * iHW + pixH * IW + pixW : resIndex); | ||
res = std::max(res, curr); | ||
} | ||
} | ||
} | ||
*dstData = res; | ||
indexDst[spatIndOff * oDHW + od * oHW + oh * OW + ow] = resIndex; | ||
}; | ||
auto poolAvg = [&] (const float *srcData, float *dstData, int od, int oh, int ow, size_t spatIndOff) { | ||
size_t dStart, dEnd, hStart, hEnd, wStart, wEnd; | ||
setBinBorders(&dStart, &dEnd, od, ID, OD); | ||
setBinBorders(&hStart, &hEnd, oh, IH, OH); | ||
setBinBorders(&wStart, &wEnd, ow, IW, OW); | ||
auto binSize = (dEnd - dStart) * (hEnd - hStart) * (wEnd - wStart); | ||
if (binSize == 0) | ||
IE_THROW() << errorPrefix << "has empty bin"; | ||
float sum = 0; | ||
for (size_t pixD = dStart; pixD < dEnd; pixD++) { | ||
for (size_t pixH = hStart; pixH < hEnd; pixH++) { | ||
for (size_t pixW = wStart; pixW < wEnd; pixW++) { | ||
float curr = srcData[pixD * inStrides[2] + pixH * inStrides[3] + pixW * inStrides[4]]; | ||
sum = sum + curr; | ||
} | ||
} | ||
} | ||
*dstData = sum / binSize; | ||
}; | ||
|
||
if (algorithm == Algorithm::AdaptivePoolingMax) { | ||
pool = poolMax; | ||
} else { | ||
pool = poolAvg; | ||
} | ||
|
||
parallel_for5d(N, blockCount, OD, OH, OW, | ||
[&](int n, int blkIdx, int od, int oh, int ow) { | ||
auto srcData = src + n * inStrides[0] + blkIdx * inStrides[1]; | ||
auto dstData = dst + n * outStrides[0] + blkIdx * outStrides[1] + | ||
od * outStrides[2] + oh * outStrides[3] + ow * outStrides[4]; | ||
int cStart = 0, cEnd = C, inResidual = 0, outResidual = 0; | ||
if (!isTailCFmt) { | ||
cStart = blkIdx * blockSize; | ||
cEnd = (blkIdx == blockCount - 1 ? C : cStart + blockSize); | ||
} | ||
for (int c = cStart; c < cEnd; c++) { | ||
if (isTailCFmt) { | ||
inResidual = c * inStrides[1]; | ||
outResidual = c * outStrides[1]; | ||
} else if (!isPlainFmt) { | ||
inResidual = outResidual = c % blockSize; | ||
} | ||
pool(srcData + inResidual, dstData + outResidual, od, oh, ow, n * C + c); | ||
}}); | ||
} | ||
|
||
bool MKLDNNAdaptivePoolingNode::created() const { | ||
return getType() == AdaptivePooling; | ||
} | ||
|
||
void MKLDNNAdaptivePoolingNode::createPrimitive() {} | ||
|
||
inline void MKLDNNAdaptivePoolingNode::setBinBorders(size_t *startPtr, size_t *endPtr, size_t idx, size_t inputLength, size_t outputLength) { | ||
*(startPtr) = idx * inputLength / outputLength; | ||
*(endPtr) = ceil(static_cast<float>((idx + 1) * inputLength) / outputLength); | ||
} | ||
|
||
REG_MKLDNN_PRIM_FOR(MKLDNNAdaptivePoolingNode, AdaptivePooling) |
35 changes: 35 additions & 0 deletions
35
inference-engine/src/mkldnn_plugin/nodes/mkldnn_adaptive_pooling.h
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,35 @@ | ||
// Copyright (C) 2021 Intel Corporation | ||
// SPDX-License-Identifier: Apache-2.0 | ||
// | ||
|
||
#pragma once | ||
|
||
#include <mkldnn_node.h> | ||
#include <string> | ||
#include <memory> | ||
#include <vector> | ||
#include <mkldnn_extension_utils.h> | ||
|
||
namespace MKLDNNPlugin { | ||
|
||
class MKLDNNAdaptivePoolingNode : public MKLDNNNode { | ||
public: | ||
MKLDNNAdaptivePoolingNode(const std::shared_ptr<ngraph::Node>& op, const mkldnn::engine& eng, MKLDNNWeightsSharing::Ptr &cache); | ||
|
||
void getSupportedDescriptors() override; | ||
void initSupportedPrimitiveDescriptors() override; | ||
void createPrimitive() override; | ||
void execute(mkldnn::stream strm) override; | ||
bool created() const override; | ||
|
||
static bool isSupportedOperation(const std::shared_ptr<ngraph::Node>& op, std::string& errorMessage) noexcept; | ||
|
||
private: | ||
int spatialDimsCount; | ||
InferenceEngine::Precision precision = InferenceEngine::Precision::FP32; | ||
inline void setBinBorders(size_t *startPtr, size_t *endPtr, size_t idx, size_t inputLength, size_t outputLength); | ||
|
||
std::string errorPrefix; | ||
}; | ||
|
||
} // namespace MKLDNNPlugin |
58 changes: 58 additions & 0 deletions
58
...ests/functional/plugin/cpu/shared_tests_instances/single_layer_tests/adaptive_pooling.cpp
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,58 @@ | ||
// Copyright (C) 2021 Intel Corporation | ||
// SPDX-License-Identifier: Apache-2.0 | ||
// | ||
|
||
#include <vector> | ||
|
||
#include "single_layer_tests/adaptive_pooling.hpp" | ||
#include "common_test_utils/test_constants.hpp" | ||
|
||
using namespace LayerTestsDefinitions; | ||
|
||
|
||
const std::vector<InferenceEngine::Precision> netPRCs = { | ||
InferenceEngine::Precision::FP16, | ||
InferenceEngine::Precision::FP32 | ||
}; | ||
|
||
const auto AdaPool3DCases = ::testing::Combine( | ||
::testing::ValuesIn( | ||
std::vector<std::vector<size_t>> { | ||
{ 1, 2, 1}, | ||
{ 1, 1, 3 }, | ||
{ 3, 17, 5 }}), | ||
::testing::ValuesIn(std::vector<std::vector<int>>{ {1}, {3}, {5} }), | ||
::testing::ValuesIn(std::vector<std::string>{"max", "avg"}), | ||
::testing::ValuesIn(netPRCs), | ||
::testing::Values(CommonTestUtils::DEVICE_CPU) | ||
); | ||
|
||
INSTANTIATE_TEST_SUITE_P(smoke_TestsAdaPool3D, AdaPoolLayerTest, AdaPool3DCases, AdaPoolLayerTest::getTestCaseName); | ||
|
||
const auto AdaPool4DCases = ::testing::Combine( | ||
::testing::ValuesIn( | ||
std::vector<std::vector<size_t>> { | ||
{ 1, 2, 1, 2}, | ||
{ 1, 1, 3, 2}, | ||
{ 3, 17, 5, 1}}), | ||
::testing::ValuesIn(std::vector<std::vector<int>>{ {1, 1}, {3, 5}, {5, 5} }), | ||
::testing::ValuesIn(std::vector<std::string>{"max", "avg"}), | ||
::testing::ValuesIn(netPRCs), | ||
::testing::Values(CommonTestUtils::DEVICE_CPU) | ||
); | ||
|
||
INSTANTIATE_TEST_SUITE_P(smoke_TestsAdaPool4D, AdaPoolLayerTest, AdaPool4DCases, AdaPoolLayerTest::getTestCaseName); | ||
|
||
const auto AdaPool5DCases = ::testing::Combine( | ||
::testing::ValuesIn( | ||
std::vector<std::vector<size_t>> { | ||
{ 1, 2, 1, 2, 2}, | ||
{ 1, 1, 3, 2, 3}, | ||
{ 3, 17, 5, 1, 2}}), | ||
::testing::ValuesIn(std::vector<std::vector<int>>{ {1, 1, 1}, {3, 5, 3}, {5, 5, 5} }), | ||
::testing::ValuesIn(std::vector<std::string>{"max", "avg"}), | ||
::testing::ValuesIn(netPRCs), | ||
::testing::Values(CommonTestUtils::DEVICE_CPU) | ||
); | ||
|
||
INSTANTIATE_TEST_SUITE_P(smoke_TestsAdaPool5D, AdaPoolLayerTest, AdaPool5DCases, AdaPoolLayerTest::getTestCaseName); |
Oops, something went wrong.