[NGraph] Add scatterNDUpdate and scatterUpdate reference implementations (#1494)

2020-08-07 16:09:28 +03:00 · 2020-08-07 16:09:28 +03:00 · 4054364fbf
commit 4054364fbf
parent caa38130b9
11 changed files with 235 additions and 200 deletions
--- a/inference-engine/src/mkldnn_plugin/CMakeLists.txt
+++ b/inference-engine/src/mkldnn_plugin/CMakeLists.txt
@ -64,7 +64,6 @@ set(LAYERS
    ${CMAKE_CURRENT_SOURCE_DIR}/nodes/gather_tree.cpp
    ${CMAKE_CURRENT_SOURCE_DIR}/nodes/grn.cpp
    ${CMAKE_CURRENT_SOURCE_DIR}/nodes/non_max_suppression.cpp
    ${CMAKE_CURRENT_SOURCE_DIR}/nodes/scatter.cpp
    ${CMAKE_CURRENT_SOURCE_DIR}/nodes/log_softmax.cpp
    ${CMAKE_CURRENT_SOURCE_DIR}/nodes/math.cpp
    ${CMAKE_CURRENT_SOURCE_DIR}/nodes/one_hot.cpp
--- a/inference-engine/src/mkldnn_plugin/nodes/list_tbl.hpp
+++ b/inference-engine/src/mkldnn_plugin/nodes/list_tbl.hpp
@ -51,7 +51,6 @@ MKLDNN_EXTENSION_NODE(FillImpl, Fill);
 MKLDNN_EXTENSION_NODE(UniqueImpl, Unique);
 MKLDNN_EXTENSION_NODE(PSROIPoolingImpl, PSROIPooling);
 MKLDNN_EXTENSION_NODE(DepthToSpaceImpl, DepthToSpace);
 MKLDNN_EXTENSION_NODE(ScatterImpl, ScatterUpdate);
 MKLDNN_EXTENSION_NODE(OneHotImpl, OneHot);
 MKLDNN_EXTENSION_NODE(BroadcastImpl, Broadcast);
 MKLDNN_EXTENSION_NODE(ExperimentalSparseWeightedReduceImpl, ExperimentalSparseWeightedSum);
--- a/inference-engine/src/mkldnn_plugin/nodes/scatter.cpp
+++ b/inference-engine/src/mkldnn_plugin/nodes/scatter.cpp
@ -1,188 +0,0 @@
 // Copyright (C) 2018-2020 Intel Corporation
 // SPDX-License-Identifier: Apache-2.0
 //
 #include "base.hpp"
 #include <cmath>
 #include <string>
 #include <vector>
 #include <cassert>
 #include <algorithm>
 #include <limits>
 #include "ie_parallel.hpp"
 #include "common/simple_copy.h"
 namespace InferenceEngine {
 namespace Extensions {
 namespace Cpu {
 // CPU extension layer that scatters 'Updates' elements into a copy of 'Data'.
 //
 // For every position p of the 'Indexes' tensor the element Updates[p] is written to the
 // output at the coordinate of p whose `axis` component is replaced by Indexes[p]
 // (see scatter()). Every other output element is copied from 'Data'.
 class ScatterImpl: public ExtLayerBase {
 public:
    // Validates the layer description and registers the single supported configuration.
    //
    // Any InferenceEngineException raised during validation is caught and its text is
    // stored in `errorMsg`; nothing is pushed to `confs` in that case.
    explicit ScatterImpl(const CNNLayer* layer) {
        try {
            if (layer->insData.size() != 3 || layer->outData.size() != 1)
                THROW_IE_EXCEPTION << layer->name << " Incorrect number of input/output tensors!";
            Precision inIdxPrecision = layer->insData[SCATTER_INDEXES].lock()->getTensorDesc().getPrecision();
            if (inIdxPrecision != Precision::FP32 && inIdxPrecision != Precision::I32)
                THROW_IE_EXCEPTION << layer->name << " Incorrect input 'Indexes' precision. Only FP32 or I32 are supported!";
            Precision inDataPrecision = layer->insData[SCATTER_DATA].lock()->getTensorDesc().getPrecision();
            if (inDataPrecision != layer->insData[SCATTER_UPDATES].lock()->getTensorDesc().getPrecision())
                THROW_IE_EXCEPTION << layer->name << " Precision should be equal for input tensors 'Data' and 'Updates'";
            // 'Data' must be a real tensor: empty shapes, {1} and SCALAR layout are rejected.
            const SizeVector& data_dims = layer->insData[SCATTER_DATA].lock()->getTensorDesc().getDims();
            if (data_dims.size() == 0 ||
                (data_dims.size() == 1 && data_dims[0] == 1) ||
                layer->insData[SCATTER_DATA].lock()->getTensorDesc().getLayout() == Layout::SCALAR)
                THROW_IE_EXCEPTION << layer->name << " 'Data' tensor rank should be >= 1";
            // A negative axis counts from the last dimension.
            axis = layer->GetParamAsInt("axis", 0);
            IE_ASSERT(-static_cast<int>(data_dims.size()) <= axis && axis < static_cast<int>(data_dims.size()))
                << layer->name << " Incorrect input parameters dimensions and axis number!";
            if (axis < 0)
                axis += data_dims.size();
            SizeVector dst_dims = layer->outData[0]->getTensorDesc().getDims();
            if (data_dims != dst_dims)
                THROW_IE_EXCEPTION << layer->name << " Incorrect number of input/output dimensions!";
            SizeVector idx_dims = layer->insData[SCATTER_INDEXES].lock()->getTensorDesc().getDims();
            if (idx_dims.size() == 0 ||
                (idx_dims.size() == 1 && idx_dims[0] == 1) ||
                layer->insData[SCATTER_INDEXES].lock()->getTensorDesc().getLayout() == Layout::SCALAR)
                THROW_IE_EXCEPTION << layer->name << " 'Indexes' tensor rank should be >= 1";
            SizeVector upd_dims = layer->insData[SCATTER_UPDATES].lock()->getTensorDesc().getDims();
            // This check is about 'Updates'; the message previously named 'Indexes'.
            if (layer->insData[SCATTER_UPDATES].lock()->getTensorDesc().getLayout() == Layout::SCALAR)
                THROW_IE_EXCEPTION << layer->name << " 'Updates' tensor rank should be >= 1";
            if (idx_dims != upd_dims)
                THROW_IE_EXCEPTION << layer->name << " Incorrect number of 'indexes' and 'updates' tensors dimension";
            // scatter() walks the 'Indexes' coordinates using the 'Data' strides, so both
            // tensors must have the same rank; otherwise the loop below and scatter()
            // would index past the end of the shorter shape.
            if (idx_dims.size() != data_dims.size())
                THROW_IE_EXCEPTION << layer->name << " Incorrect number of data and indexes dimensions!";
            // Off-axis extents of 'Indexes' must fit inside 'Data'.
            for (size_t i = 0; i < idx_dims.size(); i++) {
                if (i == static_cast<size_t>(axis)) continue;
                if (idx_dims[i] > data_dims[i])
                    THROW_IE_EXCEPTION << layer->name << " Incorrect number of data and indexes dimensions!";
            }
            LayerConfig config;
            DataConfig dataConfig, indexesConfig, updatesConfig;
            // 'Data', 'Updates' and the output are all described with the output precision.
            Precision dataPrecision = layer->outData[0]->getTensorDesc().getPrecision();
            dataConfig.desc = TensorDesc(dataPrecision, data_dims,
                                         layer->insData[SCATTER_DATA].lock()->getTensorDesc().getLayout());
            dataConfig.constant = false;
            dataConfig.inPlace = 0;
            config.inConfs.push_back(dataConfig);
            indexesConfig.desc = TensorDesc(inIdxPrecision, idx_dims,
                                            layer->insData[SCATTER_INDEXES].lock()->getTensorDesc().getLayout());
            config.inConfs.push_back(indexesConfig);
            updatesConfig.desc = TensorDesc(dataPrecision, upd_dims,
                                            layer->insData[SCATTER_UPDATES].lock()->getTensorDesc().getLayout());
            config.inConfs.push_back(updatesConfig);
            DataConfig outConfig;
            outConfig.desc = TensorDesc(dataPrecision, dst_dims, layer->outData[0]->getTensorDesc().getLayout());
            outConfig.constant = false;
            outConfig.inPlace = 0;
            config.outConfs.push_back(outConfig);
            config.dynBatchSupport = false;
            confs.push_back(config);
        } catch (InferenceEngine::details::InferenceEngineException &ex) {
            errorMsg = ex.what();
        }
    }
    // Runs the scatter, dispatching on the precision of the 'Indexes' blob.
    //
    // Returns OK on success and GENERAL_ERROR when the index precision is neither
    // FP32 nor I32. `resp` is not written by this method.
    StatusCode execute(std::vector<Blob::Ptr>& inputs, std::vector<Blob::Ptr>& outputs, ResponseDesc *resp) noexcept override {
        switch (inputs[SCATTER_INDEXES]->getTensorDesc().getPrecision()) {
            case Precision::FP32:
                scatter<float>(inputs[SCATTER_DATA], inputs[SCATTER_INDEXES], inputs[SCATTER_UPDATES], outputs[0]);
                break;
            case Precision::I32:
                scatter<int32_t>(inputs[SCATTER_DATA], inputs[SCATTER_INDEXES], inputs[SCATTER_UPDATES], outputs[0]);
                break;
            default:
                return GENERAL_ERROR;
        }
        return OK;
    }
 private:
    // Copies `data` into `output` (unless both share a buffer) and then overwrites
    // single elements with values from `updates`.
    //
    // `index_t` is the element type of `indexes` (float or int32_t). Index values are
    // truncated toward zero; values that fall outside [0, data_dims[axis]) are skipped
    // without reporting an error. Elements are moved as raw bytes, so any data
    // precision is handled.
    template <typename index_t>
    void scatter(Blob::Ptr data, Blob::Ptr indexes, Blob::Ptr updates, Blob::Ptr output) {
        // NOTE(review): the padding offset is added to byte pointers for data/updates/output;
        // confirm whether getOffsetPadding() is expressed in bytes or in elements.
        const uint8_t *src_data = data->cbuffer().as<const uint8_t *>() + data->getTensorDesc().getBlockingDesc().getOffsetPadding();
        const index_t *src_index = indexes->cbuffer().as<const index_t *>() + indexes->getTensorDesc().getBlockingDesc().getOffsetPadding();
        const uint8_t *src_updates = updates->cbuffer().as<const uint8_t *>() + updates->getTensorDesc().getBlockingDesc().getOffsetPadding();
        uint8_t *dst_data = output->cbuffer().as<uint8_t*>() + output->getTensorDesc().getBlockingDesc().getOffsetPadding();
        // Size of one data element in bytes.
        size_t data_size = data->getTensorDesc().getPrecision().size();
        InferenceEngine::SizeVector index_dims = indexes->getTensorDesc().getDims();
        InferenceEngine::SizeVector data_dims = data->getTensorDesc().getDims();
        InferenceEngine::SizeVector dataStrides = data->getTensorDesc().getBlockingDesc().getStrides();
        // Step 1: output = data, split into one contiguous byte range per thread.
        if (src_data != dst_data) {
            parallel_nt(0, [&](const int ithr, const int nthr) {
                size_t start = 0, end = 0;
                splitter(output->size(), nthr, ithr, start, end);
                size_t size = (end - start) * data_size;
                start *= data_size;
                simple_copy(dst_data + start, size, src_data + start, size);
            });
        }
        // Step 2: each thread handles a contiguous range [start, end) of index elements.
        parallel_nt(0, [&](const int ithr, const int nthr) {
            int j;
            size_t i, dst_idx = 0, start = 0, end = 0;
            SizeVector counters(index_dims.size(), 0);
            splitter(indexes->size(), nthr, ithr, start, end);
            // Decompose the linear position `start` into per-dimension counters.
            for (j = index_dims.size() - 1, i = start; j >= 0; j--) {
                counters[j] = i % index_dims[j];
                i /= index_dims[j];
            }
            // dst_idx is the output offset (in elements) of the current position with the
            // `axis` dimension left out; that dimension is supplied by the index value.
            for (i = 0; i < static_cast<size_t>(axis); ++i)
                dst_idx += counters[i] * dataStrides[i];
            for (i++; i < data_dims.size(); ++i)
                dst_idx += counters[i] * dataStrides[i];
            for (size_t iwork = start; iwork < end; iwork++) {
                // Compare in double so that negative, NaN and oversized FP32 indexes are
                // rejected before any integer conversion takes place. Values in (-1, 0)
                // truncate to 0, matching a plain float-to-integer cast.
                const double raw_idx = static_cast<double>(src_index[iwork]);
                if (raw_idx > -1.0 && raw_idx < static_cast<double>(data_dims[axis])) {
                    const size_t idx = static_cast<size_t>(raw_idx);
                    simple_copy(dst_data + data_size * (dst_idx + idx * dataStrides[axis]), data_size,
                                src_updates + iwork * data_size, data_size);
                }
                // Advance the counters to the next index position, last dimension first.
                for (j = index_dims.size() - 1; j >= 0; j--) {
                    counters[j]++;
                    if (counters[j] < index_dims[j]) {
                        if (j != axis)
                            dst_idx += dataStrides[j];
                        break;
                    } else {
                        // Dimension j wrapped around: rebuild dst_idx from the counters and
                        // carry into the next outer dimension.
                        counters[j] = 0;
                        for (dst_idx = 0, i = 0; i < static_cast<size_t>(axis); ++i)
                            dst_idx += counters[i] * dataStrides[i];
                        for (i++; i < data_dims.size(); ++i)
                            dst_idx += counters[i] * dataStrides[i];
                    }
                }
            }
        });
    }
    // Scatter axis, normalized to [0, rank of 'Data') by the constructor.
    int axis = 0;
    // Positions of the three inputs in `insData` / `inputs`.
    const size_t SCATTER_DATA = 0;
    const size_t SCATTER_INDEXES = 1;
    const size_t SCATTER_UPDATES = 2;
 };
 REG_FACTORY_FOR(ScatterImpl, ScatterUpdate);
 }  // namespace Cpu
 }  // namespace Extensions
 }  // namespace InferenceEngine
--- a/inference-engine/tests/functional/plugin/cpu/shared_tests_instances/single_layer_tests/scatter_ND_update.cpp
+++ b/inference-engine/tests/functional/plugin/cpu/shared_tests_instances/single_layer_tests/scatter_ND_update.cpp
@ -36,7 +36,6 @@ const auto ScatterNDUpdateCases = ::testing::Combine(
        ::testing::Values(CommonTestUtils::DEVICE_CPU)
 );
-// open after ops support in ngraph merged
+INSTANTIATE_TEST_CASE_P(ScatterNDUpdate, ScatterNDUpdateLayerTest, ScatterNDUpdateCases, ScatterNDUpdateLayerTest::getTestCaseName);
 // INSTANTIATE_TEST_CASE_P(ScatterNDUpdate, ScatterNDUpdateLayerTest, ScatterNDUpdateCases, ScatterNDUpdateLayerTest::getTestCaseName);
 }  // namespace
--- a/inference-engine/tests/functional/plugin/cpu/shared_tests_instances/single_layer_tests/scatter_update.cpp
+++ b/inference-engine/tests/functional/plugin/cpu/shared_tests_instances/single_layer_tests/scatter_update.cpp
@ -41,7 +41,6 @@ const auto ScatterUpdateCase = ::testing::Combine(
        ::testing::Values(CommonTestUtils::DEVICE_CPU)
 );
-// open after ngraph reference implementation merged
+INSTANTIATE_TEST_CASE_P(ScatterUpdate, ScatterUpdateLayerTest, ScatterUpdateCase, ScatterUpdateLayerTest::getTestCaseName);
 // INSTANTIATE_TEST_CASE_P(ScatterUpdate, ScatterUpdateLayerTest, ScatterUpdateCase, ScatterUpdateLayerTest::getTestCaseName);
 }  // namespace
--- a/inference-engine/tests/ngraph_functions/include/ngraph_functions/builders.hpp
+++ b/inference-engine/tests/ngraph_functions/include/ngraph_functions/builders.hpp
@ -10,6 +10,7 @@
 #include <ngraph/opsets/opset1.hpp>
 #include <ngraph/opsets/opset2.hpp>
 #include <ngraph/opsets/opset3.hpp>
 #include <ngraph/opsets/opset4.hpp>
 #include "ngraph_functions/utils/data_utils.hpp"
--- a/inference-engine/tests/ngraph_functions/src/scatter_ND_update.cpp
+++ b/inference-engine/tests/ngraph_functions/src/scatter_ND_update.cpp
@ -13,10 +13,8 @@ std::shared_ptr<ngraph::Node> makeScatterNDUpdate(const ngraph::Output<Node> &in
                                                  const std::vector<size_t>& indices,
                                                  const ngraph::Output<Node> &update) {
    auto indicesNode = std::make_shared<ngraph::opset1::Constant>(indicesType, indicesShape, indices);
-    // blocked by ngraph merge
+    auto dtsNode = std::make_shared<ngraph::opset4::ScatterNDUpdate>(in, indicesNode, update);
-    // auto dtsNode = std::make_shared<ngraph::opset3::ScatterNDUpdate>(in, indicesNode, update);
+    return dtsNode;
    // return dtsNode;
    return nullptr;
 }
 }  // namespace builder
--- a/ngraph/test/runtime/interpreter/int_executable.hpp
+++ b/ngraph/test/runtime/interpreter/int_executable.hpp
@ -93,6 +93,8 @@
 #include "op/group_conv.hpp"
 #include "reference/detection_output.hpp"
 #include "reference/scatter_nd_update.hpp"
 #include "reference/scatter_update.hpp"
 namespace ngraph
 {
@ -1144,6 +1146,81 @@ protected:
            break;
        }
        case OP_TYPEID::ScatterNDUpdate_v3:
        {
            // Run the ScatterNDUpdate reference kernel, instantiated for the element type
            // of the 'indices' input (input 1). Inputs 0/1/2 are data/indices/updates.
            const auto* ndUpdateOp = static_cast<const op::v3::ScatterNDUpdate*>(&node);
            const auto indicesElemType = ndUpdateOp->get_input_element_type(1);
            const bool indicesAreI32 = (indicesElemType == element::i32);
            const bool indicesAreI64 = (indicesElemType == element::i64);
            if (!indicesAreI32 && !indicesAreI64)
            {
                throw ngraph_error(
                    "ScatterNDUpdate layer support only i32 and i64 'indices' input precision!");
            }
            if (indicesAreI32)
            {
                reference::scatterNdUpdate<T, int32_t>(args[0]->get_data_ptr<const T>(),
                                                       args[1]->get_data_ptr<const int32_t>(),
                                                       args[2]->get_data_ptr<const T>(),
                                                       out[0]->get_data_ptr<T>(),
                                                       node.get_input_shape(0),
                                                       node.get_input_shape(1),
                                                       node.get_input_shape(2));
            }
            else
            {
                reference::scatterNdUpdate<T, int64_t>(args[0]->get_data_ptr<const T>(),
                                                       args[1]->get_data_ptr<const int64_t>(),
                                                       args[2]->get_data_ptr<const T>(),
                                                       out[0]->get_data_ptr<T>(),
                                                       node.get_input_shape(0),
                                                       node.get_input_shape(1),
                                                       node.get_input_shape(2));
            }
            break;
        }
        case OP_TYPEID::ScatterUpdate_v3:
        {
            // Run the ScatterUpdate reference kernel. Inputs 0/1/2/3 are
            // data/indices/updates/axis.
            const op::v3::ScatterUpdate* scatterUpd =
                static_cast<const op::v3::ScatterUpdate*>(&node);
            // The kernel is only instantiated with an int64_t axis, so reject other types.
            // (The message previously named ScatterNDUpdate, which is a different op.)
            if (scatterUpd->get_input_element_type(3) != element::i64)
                throw ngraph_error(
                    "ScatterUpdate layer support only i64 'axis' input precision!");
            // Pick the kernel instantiation that matches the 'indices' element type.
            auto idxType = scatterUpd->get_input_element_type(1);
            if (idxType == element::i32)
            {
                reference::scatterUpdate<T, int32_t, int64_t>(
                    args[0]->get_data_ptr<const T>(),
                    args[1]->get_data_ptr<const int32_t>(),
                    args[2]->get_data_ptr<const T>(),
                    args[3]->get_data_ptr<const int64_t>(),
                    out[0]->get_data_ptr<T>(),
                    node.get_input_shape(0),
                    node.get_input_shape(1),
                    node.get_input_shape(2));
            }
            else if (idxType == element::i64)
            {
                reference::scatterUpdate<T, int64_t, int64_t>(
                    args[0]->get_data_ptr<const T>(),
                    args[1]->get_data_ptr<const int64_t>(),
                    args[2]->get_data_ptr<const T>(),
                    args[3]->get_data_ptr<const int64_t>(),
                    out[0]->get_data_ptr<T>(),
                    node.get_input_shape(0),
                    node.get_input_shape(1),
                    node.get_input_shape(2));
            }
            else
            {
                throw ngraph_error(
                    "ScatterUpdate layer support only i32 and i64 'indices' input precision!");
            }
            break;
        }
        // Fused Ops are not supported in interpreter. They need to be decomposed before execution
        case OP_TYPEID::DepthToSpace:
--- a/ngraph/test/runtime/interpreter/opset_int_tbl.hpp
+++ b/ngraph/test/runtime/interpreter/opset_int_tbl.hpp
@ -37,4 +37,6 @@ NGRAPH_OP(EmbeddingSegmentsSum, op::v3)
 NGRAPH_OP(ExtractImagePatches, op::v3)
 NGRAPH_OP(ShapeOf, op::v3)
 NGRAPH_OP(NonZero, op::v3)
 NGRAPH_OP(ScatterNDUpdate, op::v3)
 NGRAPH_OP(ScatterUpdate, op::v3)
 #undef ID_SUFFIX
--- a/ngraph/test/runtime/interpreter/reference/scatter_nd_update.hpp
+++ b/ngraph/test/runtime/interpreter/reference/scatter_nd_update.hpp
@ -0,0 +1,63 @@
 // Copyright (C) 2020 Intel Corporation
 // SPDX-License-Identifier: Apache-2.0
 //
 #pragma once
 #include "ngraph/coordinate_transform.hpp"
 #include "ngraph/shape.hpp"
 using namespace ngraph;
 namespace ngraph
 {
    namespace runtime
    {
        namespace reference
        {
            template <typename dataType, typename indicesType>
            void scatterNdUpdate(const dataType* inputData,
                                 const indicesType* indices,
                                 const dataType* updates,
                                 dataType* outBuf,
                                 const Shape& dataShape,
                                 const Shape& indicesShape,
                                 const Shape& updatesShape)
            {
                size_t numSlices = 1;
                size_t sliceSize = 1;
                for (size_t i = 0; i < indicesShape.size() - 1; i++)
                {
                    numSlices *= indicesShape[i];
                }
                for (size_t i = indicesShape.size() - 1; i < updatesShape.size(); i++)
                {
                    sliceSize *= updatesShape[i];
                }
                const size_t k = indicesShape.back();
                std::memcpy(outBuf, inputData, sizeof(dataType) * shape_size(dataShape));
                CoordinateTransform dataTransform{dataShape};
                for (size_t i = 0; i < numSlices; i++)
                {
                    Coordinate coord;
                    for (size_t j = 0; j < k; j++)
                    {
                        coord.push_back(indices[i * k + j]);
                    }
                    for (size_t j = k; j < dataShape.size(); j++)
                    {
                        coord.push_back(0);
                    }
                    const size_t startDataIdx = dataTransform.index(coord);
                    for (size_t j = 0; j < sliceSize; j++)
                    {
                        outBuf[startDataIdx + j] = updates[i * sliceSize + j];
                    }
                }
            }
        } // namespace reference
    }     // namespace runtime
 } // namespace ngraph
--- a/ngraph/test/runtime/interpreter/reference/scatter_update.hpp
+++ b/ngraph/test/runtime/interpreter/reference/scatter_update.hpp
@ -0,0 +1,86 @@
 // Copyright (C) 2020 Intel Corporation
 // SPDX-License-Identifier: Apache-2.0
 //
 #pragma once
 #include <string>
 #include "ngraph/coordinate_transform.hpp"
 #include "ngraph/shape.hpp"
 using namespace ngraph;
 namespace ngraph
 {
    namespace runtime
    {
        namespace reference
        {
            template <typename dataType, typename indicesType, typename axisType>
            void scatterUpdate(const dataType* inputData,
                               const indicesType* indices,
                               const dataType* updates,
                               const axisType* _axis,
                               dataType* outBuf,
                               const Shape& dataShape,
                               const Shape& indicesShape,
                               const Shape& updatesShape)
            {
                int rank = static_cast<int>(dataShape.size());
                if (_axis[0] < -rank || _axis[0] > rank - 1)
                {
                    std::string error =
                        std::string("ScatterUpdate layer has out of bounds axis value: ") +
                        std::to_string(_axis[0]);
                    throw ngraph_error(error);
                }
                size_t axis = _axis[0] < 0 ? _axis[0] + rank : _axis[0];
                CoordinateTransform indicesTransform{indicesShape};
                Shape dataShapeIter = dataShape;
                dataShapeIter.erase(dataShapeIter.begin() + axis);
                CoordinateTransform dataTransfIter{dataShapeIter};
                CoordinateTransform updateTransform{updatesShape};
                CoordinateTransform dataTransform{dataShape};
                std::memcpy(outBuf, inputData, sizeof(dataType) * shape_size(dataShape));
                for (const Coordinate& indicesCoordIt : indicesTransform)
                {
                    const size_t indicesIdx = indicesTransform.index(indicesCoordIt);
                    if (indices[indicesIdx] < 0)
                    {
                        std::string error =
                            std::string("ScatterUpdate layer has negative index value: ") +
                            std::to_string(indices[indicesIdx]);
                        throw ngraph_error(error);
                    }
                    const size_t idx = static_cast<size_t>(indices[indicesIdx]);
                    if (dataShape[axis] <= idx)
                    {
                        std::string error =
                            std::string("ScatterUpdate layer has out of bounds coordinate: ") +
                            std::to_string(idx) + " on 'data' input on " + std::to_string(axis) +
                            "th axis";
                        throw ngraph_error(error);
                    }
                    for (const Coordinate& dataCoordIt : dataTransfIter)
                    {
                        Coordinate dataCoord = dataCoordIt;
                        dataCoord.insert(dataCoord.begin() + axis, idx);
                        const size_t startIndices = dataTransform.index(dataCoord);
                        auto updCoord = dataCoordIt;
                        updCoord.insert(
                            updCoord.begin() + axis, indicesCoordIt.begin(), indicesCoordIt.end());
                        const size_t startUpd = updateTransform.index(updCoord);
                        outBuf[startIndices] = updates[startUpd];
                    }
                }
            }
        } // namespace reference
    }     // namespace runtime
 } // namespace ngraph