[CPU BF16] BF16 support was added to the SoftMax primitive. (#4279)
commit 274a70bd14
parent 75eca09abd
@@ -23,7 +23,7 @@ class BF16Transformer {
         "broadcast", "convert", "BatchToSpace", "DepthToSpace", "ExtractImagePatches", "concat", "power", "lrn",
         "permute", "ScatterUpdate", "ScatterElementsUpdate", "ScatterNDUpdate", "depthwise",
         "select", "ShuffleChannels", "SpaceToBatch", "SpaceToDepth", "squeeze", "StridedSlice", "unsqueeze", "eltwise",
-        "ReduceAnd", "ReduceOr", "ReduceMax", "ReduceMin", "ScaleShift"};
+        "ReduceAnd", "ReduceOr", "ReduceMax", "ReduceMin", "ScaleShift", "SoftMax"};
 
     const InferenceEngine::details::caseless_set<std::string> _multiinput =
         { "concat", "eltwise" };
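For context: the companion _multiinput set below is an InferenceEngine::details::caseless_set, and the layer-type whitelist above presumably works the same way, so lookups ignore case and "softmax" matches the "SoftMax" entry this commit adds. Below is a minimal self-contained sketch of such a case-insensitive whitelist, using a plain std::set with a custom comparator as a stand-in for the real caseless_set (not the actual InferenceEngine implementation):

// Sketch of a case-insensitive layer-type whitelist, mimicking the idea
// behind InferenceEngine::details::caseless_set. Stand-in code for
// illustration only.
#include <algorithm>
#include <cctype>
#include <iostream>
#include <set>
#include <string>

struct CaselessLess {
    bool operator()(const std::string& a, const std::string& b) const {
        // Order strings by comparing lowercased characters element by element.
        return std::lexicographical_compare(
            a.begin(), a.end(), b.begin(), b.end(),
            [](unsigned char l, unsigned char r) {
                return std::tolower(l) < std::tolower(r);
            });
    }
};

int main() {
    // After this commit, "SoftMax" is part of the whitelist.
    const std::set<std::string, CaselessLess> bf16Whitelist = {
        "convert", "concat", "power", "lrn", "eltwise", "ScaleShift", "SoftMax"};

    // Case-insensitive membership: every spelling hits the same entry.
    std::cout << bf16Whitelist.count("softmax") << '\n';  // prints 1
    std::cout << bf16Whitelist.count("SOFTMAX") << '\n';  // prints 1
}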
@@ -21,7 +21,7 @@ void MKLDNNSoftMaxNode::getSupportedDescriptors() {
         return;
 
     InferenceEngine::Precision precision = getCnnLayer()->insData[0].lock()->getPrecision();
-    if (precision != InferenceEngine::Precision::FP32)
+    if (precision != InferenceEngine::Precision::FP32 && precision != InferenceEngine::Precision::BF16)
         precision = InferenceEngine::Precision::FP32;
     auto inputDataType = MKLDNNExtensionUtils::IEPrecisionToDataType(precision);
 
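The changed condition keeps BF16 inputs intact instead of coercing everything that is not FP32 down to FP32. A standalone sketch of that fallback rule, using a stand-in Precision enum rather than the real InferenceEngine::Precision type:

// Sketch of the precision-fallback rule from getSupportedDescriptors():
// FP32 and BF16 pass through unchanged; anything else is coerced to FP32.
// Precision here is a stand-in enum, not InferenceEngine::Precision.
#include <cassert>

enum class Precision { FP32, BF16, FP16, I8 };

Precision normalizeSoftMaxPrecision(Precision precision) {
    if (precision != Precision::FP32 && precision != Precision::BF16)
        precision = Precision::FP32;  // fall back for unsupported types
    return precision;
}

int main() {
    assert(normalizeSoftMaxPrecision(Precision::BF16) == Precision::BF16);  // kept after this commit
    assert(normalizeSoftMaxPrecision(Precision::FP16) == Precision::FP32);  // still coerced
    return 0;
}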
@@ -0,0 +1,132 @@
+// Copyright (C) 2021 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#include <ngraph_functions/builders.hpp>
+#include "test_utils/cpu_test_utils.hpp"
+
+using namespace InferenceEngine;
+using namespace CPUTestUtils;
+
+namespace CPULayerTestsDefinitions {
+
+struct SoftMaxConfig {
+    InferenceEngine::SizeVector inputShape;
+    size_t axis;
+};
+
+typedef std::tuple<
+    InferenceEngine::Precision,  // netPrecision
+    SoftMaxConfig,               // softmaxTestConfig
+    std::string,                 // targetDevice
+    CPUSpecificParams
+> softmaxCPUTestParams;
+
+class SoftMaxLayerCPUTest : public testing::WithParamInterface<softmaxCPUTestParams>,
+                            virtual public LayerTestsUtils::LayerTestsCommon, public CPUTestsBase {
+public:
+    static std::string getTestCaseName(const testing::TestParamInfo<softmaxCPUTestParams>& obj) {
+        CPUSpecificParams cpuParams;
+        InferenceEngine::Precision netPrecision;
+        SoftMaxConfig config;
+        std::string targetDevice;
+        std::tie(netPrecision, config, targetDevice, cpuParams) = obj.param;
+
+        std::ostringstream result;
+        result << "netPRC=" << netPrecision.name() << "_";
+        result << "IS=" << CommonTestUtils::vec2str(config.inputShape) << "_";
+        result << "axis=" << config.axis << "_";
+        result << "trgDev=" << targetDevice;
+        result << CPUTestsBase::getTestCaseName(cpuParams);
+
+        return result.str();
+    }
+
+protected:
+    void SetUp() override {
+        InferenceEngine::Precision netPrecision;
+        SoftMaxConfig config;
+        CPUSpecificParams cpuParams;
+        std::tie(netPrecision, config, targetDevice, cpuParams) = this->GetParam();
+
+        inPrc = outPrc = netPrecision;
+
+        std::tie(inFmts, outFmts, priority, selectedType) = cpuParams;
+        if (selectedType.empty()) {
+            selectedType = getPrimitiveType();
+        }
+        selectedType.push_back('_');
+        selectedType += inPrc.name();
+
+        const auto ngPrc = FuncTestUtils::PrecisionUtils::convertIE2nGraphPrc(netPrecision);
+
+        auto params = ngraph::builder::makeParams(ngPrc, {config.inputShape});
+
+        const auto paramOuts =
+            ngraph::helpers::convert2OutputVector(ngraph::helpers::castOps2Nodes<ngraph::op::Parameter>(params));
+
+        const auto softMax = std::make_shared<ngraph::opset1::Softmax>(paramOuts.at(0), config.axis);
+
+        function = makeNgraphFunction(ngPrc, params, softMax, "SoftMax");
+    }
+};
+
+TEST_P(SoftMaxLayerCPUTest, CompareWithRefs) {
+    SKIP_IF_CURRENT_TEST_IS_DISABLED()
+
+    Run();
+    CheckPluginRelatedResults(executableNetwork, "SoftMax");
+}
+
+namespace {
+// not optimized CPU spec
+const auto notOptimizedCPUSpec = CPUSpecificParams{{}, {}, {}, "ref_any"};
+
+const std::vector<SoftMaxConfig> optimizedConfigsFP32 {
+    {InferenceEngine::SizeVector{1, 100}, 1},
+    {InferenceEngine::SizeVector{10, 10}, 1},
+    {InferenceEngine::SizeVector{100, 1}, 0},
+    {InferenceEngine::SizeVector{100, 1}, 1},
+    {InferenceEngine::SizeVector{5, 5, 1}, 1},
+    {InferenceEngine::SizeVector{5, 5, 5}, 2},
+    {InferenceEngine::SizeVector{5, 5, 5, 5}, 0},
+    {InferenceEngine::SizeVector{5, 5, 1, 1}, 1},
+    {InferenceEngine::SizeVector{5, 5, 5, 5}, 1},
+    {InferenceEngine::SizeVector{5, 5, 5, 1}, 2},
+    {InferenceEngine::SizeVector{5, 5, 5, 5}, 2},
+    {InferenceEngine::SizeVector{5, 5, 5, 5}, 3},
+    {InferenceEngine::SizeVector{5, 5, 5, 5, 5}, 0},
+    {InferenceEngine::SizeVector{5, 5, 1, 1, 1}, 1},
+    {InferenceEngine::SizeVector{5, 5, 5, 5, 5}, 1},
+    {InferenceEngine::SizeVector{5, 5, 5, 1, 1}, 2},
+    {InferenceEngine::SizeVector{5, 5, 5, 5, 5}, 2},
+    {InferenceEngine::SizeVector{5, 5, 5, 1, 1}, 3},
+    {InferenceEngine::SizeVector{5, 5, 5, 5, 5}, 3},
+    {InferenceEngine::SizeVector{5, 5, 5, 5, 1}, 4},
+    {InferenceEngine::SizeVector{5, 5, 5, 5, 5}, 4},
+};
+
+const std::vector<SoftMaxConfig> notOptimizedConfigsFP32 {
+    {InferenceEngine::SizeVector{1, 100}, 0},
+    {InferenceEngine::SizeVector{10, 10}, 0},
+    {InferenceEngine::SizeVector{10, 10, 10}, 0},
+    {InferenceEngine::SizeVector{10, 10, 10}, 1},
+};
+
+const auto OptimizedParams = testing::Combine(
+    testing::Values(Precision::FP32, Precision::BF16),
+    testing::ValuesIn(optimizedConfigsFP32),
+    testing::Values(CommonTestUtils::DEVICE_CPU),
+    testing::Values(emptyCPUSpec));
+
+INSTANTIATE_TEST_CASE_P(smoke_SoftMax_Optimized_CPU, SoftMaxLayerCPUTest, OptimizedParams, SoftMaxLayerCPUTest::getTestCaseName);
+
+const auto NotOptimizedParams = testing::Combine(
+    testing::Values(Precision::FP32, Precision::BF16),
+    testing::ValuesIn(notOptimizedConfigsFP32),
+    testing::Values(CommonTestUtils::DEVICE_CPU),
+    testing::Values(notOptimizedCPUSpec));
+
+INSTANTIATE_TEST_CASE_P(smoke_SoftMax_CPU, SoftMaxLayerCPUTest, NotOptimizedParams, SoftMaxLayerCPUTest::getTestCaseName);
+
+} // namespace
+} // namespace CPULayerTestsDefinitions
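The two INSTANTIATE_TEST_CASE_P calls above rely on testing::Combine, which generates the Cartesian product of its argument generators: each precision (FP32, BF16) is paired with every shape/axis config, and each combination becomes a separately named test instance. A small self-contained GoogleTest sketch of that expansion (hypothetical names, not part of this commit):

// Minimal illustration of testing::Combine: 2 precisions x 3 axes below
// yield 6 generated tests. Requires GoogleTest; names are invented.
#include <gtest/gtest.h>
#include <string>
#include <tuple>

using Params = std::tuple<std::string /*precision*/, int /*axis*/>;

class ComboTest : public testing::TestWithParam<Params> {};

TEST_P(ComboTest, Expands) {
    const auto& [precision, axis] = GetParam();
    EXPECT_TRUE(precision == "FP32" || precision == "BF16");
    EXPECT_GE(axis, 0);
}

INSTANTIATE_TEST_CASE_P(Demo, ComboTest,
                        testing::Combine(testing::Values(std::string("FP32"), std::string("BF16")),
                                         testing::Values(0, 1, 2)));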
inference-engine/thirdparty/mkl-dnn (vendored)
@@ -1 +1 @@
-Subproject commit f2b67dc5bc8de2e6c5603bfb1c22ab1a3d865cc7
+Subproject commit e8879c1c30daaf85a9aab6323a167138b59653fa