[PT FE ] Add aten::index_put_ operator with layer test (#15668)

2023-02-16 08:28:46 +01:00
parent 70cb829992
commit fab35896cb
4 changed files with 226 additions and 1 deletions
--- a/src/frontends/pytorch/src/op/index_put_.cpp
+++ b/src/frontends/pytorch/src/op/index_put_.cpp
@@ -0,0 +1,124 @@
+// Copyright (C) 2018-2023 Intel Corporation
+// SPDX-License-Identifier: Apache-2.0
+//
+
+#include "openvino/frontend/pytorch/node_context.hpp"
+#include "openvino/op/add.hpp"
+#include "openvino/op/broadcast.hpp"
+#include "openvino/op/concat.hpp"
+#include "openvino/op/constant.hpp"
+#include "openvino/op/convert_like.hpp"
+#include "openvino/op/gather.hpp"
+#include "openvino/op/mod.hpp"
+#include "openvino/op/scatter_nd_update.hpp"
+#include "openvino/op/shape_of.hpp"
+#include "openvino/op/slice.hpp"
+#include "openvino/op/split.hpp"
+#include "openvino/op/unsqueeze.hpp"
+#include "utils.hpp"
+
+namespace ov {
+namespace frontend {
+namespace pytorch {
+namespace op {
+
+using namespace ov::op;
+
+namespace {
+Output<Node> generate_zeros_with_convertlike(const NodeContext& context,
+                                             const Output<Node> sizes,
+                                             const Output<Node> tensor_of_type) {
+    auto const_0 = context.mark_node(v0::Constant::create(element::i32, Shape{}, {0}));
+    auto zeros = context.mark_node(std::make_shared<v3::Broadcast>(const_0, sizes));
+    return context.mark_node(std::make_shared<v1::ConvertLike>(zeros, tensor_of_type));
+}
+}  // namespace
+
+OutputVector translate_index_put_(NodeContext& context) {
+    num_inputs_check(context, 4, 4);
+    auto const_0 = context.mark_node(v0::Constant::create(element::i32, Shape{}, {0}));
+    auto const_1 = context.mark_node(v0::Constant::create(element::i32, Shape{1}, {1}));
+    auto const_max_int =
+        context.mark_node(v0::Constant::create(element::i32, Shape{1}, {std::numeric_limits<int32_t>::max()}));
+    auto const_neg_1 = context.mark_node(v0::Constant::create(element::i32, Shape{}, {-1}));
+
+    auto input = context.get_input(0);
+    auto input_shape = context.mark_node(std::make_shared<v3::ShapeOf>(input, element::i32));
+    auto indices = context.get_input(1);
+    auto values = context.get_input(2);
+    auto accumulate = context.const_input<bool>(3);
+
+    auto indices_partial_shape = indices.get_partial_shape();
+    FRONT_END_OP_CONVERSION_CHECK(indices_partial_shape.rank().is_static(),
+                                  "We support only indices with static rank.");
+    auto indices_first_dim = indices_partial_shape[0];
+    FRONT_END_OP_CONVERSION_CHECK(indices_first_dim.is_static(),
+                                  "We support only lists of tensors with static number of elements.");
+    int64_t indices_list_len = indices_first_dim.get_length();
+    if (indices_list_len == 0) {
+        return {values};
+    }
+
+    auto const_indices_list_len = context.mark_node(v0::Constant::create(element::i32, Shape{1}, {indices_list_len}));
+    auto split_indices = context.mark_node(std::make_shared<v1::Split>(indices, const_0, indices_list_len));
+
+    std::shared_ptr<Node> broadcast_index_shape;
+    Output<Node> index;
+    if (indices_list_len > 1) {
+        index = split_indices->output(0);
+        for (int i = 1; i < indices_list_len; i++) {
+            index = context.mark_node(std::make_shared<v1::Add>(index, split_indices->output(i)));
+        }
+        broadcast_index_shape = context.mark_node(std::make_shared<v3::ShapeOf>(index, element::i32));
+        OutputVector indices_list;
+        for (int i = 0; i < indices_list_len; i++) {
+            auto broadcast =
+                context.mark_node(std::make_shared<v3::Broadcast>(split_indices->output(i), broadcast_index_shape));
+            auto unsqueeze = context.mark_node(std::make_shared<v0::Unsqueeze>(broadcast, const_neg_1));
+
+            // change negative indices to positive indices
+            auto const_i = context.mark_node(v0::Constant::create(element::i32, Shape{}, {i}));
+            auto dim_i = context.mark_node(std::make_shared<v8::Gather>(input_shape, const_i, const_0));
+            auto dim_i_correct_type = context.mark_node(std::make_shared<v1::ConvertLike>(dim_i, index));
+            unsqueeze = context.mark_node(std::make_shared<v1::Add>(unsqueeze, dim_i_correct_type));
+            unsqueeze = context.mark_node(std::make_shared<v1::Mod>(unsqueeze, dim_i_correct_type));
+
+            indices_list.push_back(unsqueeze);
+        }
+        index = context.mark_node(std::make_shared<v0::Concat>(indices_list, -1));
+    } else {
+        index = split_indices->output(0);
+
+        // change negative indices to positive indices
+        auto dim_0 = context.mark_node(std::make_shared<v8::Gather>(input_shape, const_0, const_0));
+        auto dim_0_correct_type = context.mark_node(std::make_shared<v1::ConvertLike>(dim_0, index));
+        index = context.mark_node(std::make_shared<v1::Add>(index, dim_0_correct_type));
+        index = context.mark_node(std::make_shared<v1::Mod>(index, dim_0_correct_type));
+
+        broadcast_index_shape = context.mark_node(std::make_shared<v3::ShapeOf>(index, element::i32));
+        index = context.mark_node(std::make_shared<v0::Unsqueeze>(index, const_neg_1));
+    }
+
+    auto sub_data_shape =
+        context.mark_node(std::make_shared<v8::Slice>(input_shape, const_indices_list_len, const_max_int, const_1));
+    auto values_shape =
+        context.mark_node(std::make_shared<v0::Concat>(OutputVector{broadcast_index_shape, sub_data_shape}, 0));
+    values = context.mark_node(std::make_shared<v3::Broadcast>(values, values_shape));
+    values = context.mark_node(std::make_shared<v1::ConvertLike>(values, input));
+
+    Output<Node> result;
+    if (accumulate) {
+        auto zeros = generate_zeros_with_convertlike(context, input_shape, input);
+        result = context.mark_node(std::make_shared<v3::ScatterNDUpdate>(zeros, index, values));
+        result = context.mark_node(std::make_shared<v1::Add>(input, result));
+    } else {
+        result = context.mark_node(std::make_shared<v3::ScatterNDUpdate>(input, index, values));
+    }
+
+    return {result};
+};
+
+}  // namespace op
+}  // namespace pytorch
+}  // namespace frontend
+}  // namespace ov
--- a/src/frontends/pytorch/src/op/list_construct.cpp
+++ b/src/frontends/pytorch/src/op/list_construct.cpp
@@ -5,6 +5,7 @@
 #include "openvino/frontend/pytorch/node_context.hpp"
 #include "openvino/op/concat.hpp"
 #include "openvino/op/constant.hpp"
+#include "openvino/op/unsqueeze.hpp"
 #include "utils.hpp"

 namespace ov {
@@ -16,6 +17,7 @@ using namespace ov::op;

 OutputVector translate_list_construct(NodeContext& context) {
    // Process the case when prim::ListConstruct has all inputs constant
+    auto const_0 = context.mark_node(v0::Constant::create(element::i32, Shape{}, {0}));
    ov::OutputVector consts;
    for (size_t i = 0; i < context.get_input_size(); i++) {
        auto input = context.get_input_from_visible_context(i);
@@ -23,8 +25,11 @@ OutputVector translate_list_construct(NodeContext& context) {
        FRONT_END_OP_CONVERSION_CHECK(c_node, "Translation for prim::ListConstruct support only constant inputs");
        if (c_node->get_shape().size() == 0) {
            c_node = std::make_shared<v0::Constant>(c_node->get_element_type(), Shape{1}, c_node->get_data_ptr());
+            consts.push_back(c_node);
+        } else {
+            auto unsqueezed_c_node = context.mark_node(std::make_shared<v0::Unsqueeze>(c_node, const_0));
+            consts.push_back(unsqueezed_c_node);
        }
-        consts.push_back(c_node);
    }
    auto list_construct = std::make_shared<v0::Concat>(consts, 0);
    if (list_construct->has_evaluate()) {
--- a/src/frontends/pytorch/src/op_table.cpp
+++ b/src/frontends/pytorch/src/op_table.cpp
@@ -53,6 +53,7 @@ OP_CONVERTER(translate_group_norm);
 OP_CONVERTER(translate_hardtanh);
 OP_CONVERTER(translate_if);
 OP_CONVERTER(translate_im2col);
+OP_CONVERTER(translate_index_put_);
 OP_CONVERTER(translate_instance_norm);
 OP_CONVERTER(translate_int);
 OP_CONVERTER(translate_layer_norm);
@@ -208,6 +209,7 @@ const std::map<std::string, CreatorFunction> get_supported_ops() {
        {"aten::hardtanh", op::translate_hardtanh},
        {"aten::hardtanh_", op::inplace_op<op::translate_hardtanh>},
        {"aten::im2col", op::translate_im2col},
+        {"aten::index_put_", op::inplace_op<op::translate_index_put_>},
        {"aten::instance_norm", op::translate_instance_norm},
        {"aten::Int", op::translate_int},
        {"aten::IntImplicit", op::translate_int},
--- a/tests/layer_tests/pytorch_tests/test_index_put_.py
+++ b/tests/layer_tests/pytorch_tests/test_index_put_.py
@@ -0,0 +1,94 @@
+# Copyright (C) 2018-2023 Intel Corporation
+# SPDX-License-Identifier: Apache-2.0
+
+
+import numpy as np
+import pytest
+import torch
+
+from pytorch_layer_test_class import PytorchLayerTest
+
+
+class TestIndexPut_SingleIndices(PytorchLayerTest):
+    def _prepare_input(self):
+        return (self.input_tensor, self.values)
+
+    def create_model(self, indices, accumulate):
+
+        class aten_index_put_(torch.nn.Module):
+
+            def __init__(self, indices, accumulate):
+                super().__init__()
+                self.indices = indices
+                self.accumulate = accumulate
+
+            def forward(self, input_tensor, values):
+                input_tensor.index_put_((self.indices,), values, self.accumulate)
+                return input_tensor
+
+        ref_net = None
+
+        return aten_index_put_(indices, accumulate), ref_net, "aten::index_put_"
+
+    @pytest.mark.parametrize('input_data', ({'input_tensor': np.random.randn(5).astype(np.float32),
+                                             'values': np.array(11).astype(np.float32)},
+                                             {'input_tensor': np.random.randn(3, 3).astype(np.float32),
+                                             'values': np.array([10, 11, 12]).astype(np.float32)}))
+    @pytest.mark.parametrize('indices', (torch.tensor([0], dtype=torch.long),
+                                         torch.tensor([-1, -2], dtype=torch.long),
+                                         torch.tensor([0, -1, -2], dtype=torch.long),
+                                         torch.tensor([1, 2], dtype=torch.long),
+                                         torch.tensor([0, 1, 2], dtype=torch.long)))
+    @pytest.mark.parametrize('accumulate', (True, False))
+    @pytest.mark.nightly
+    @pytest.mark.precommit
+    def test_index_put_single_indices(self, ie_device, precision, ir_version, input_data, indices, accumulate):
+        self.input_tensor = input_data['input_tensor']
+        self.values = input_data['values']
+        self._test(*self.create_model(indices, accumulate), ie_device, precision, ir_version)
+
+class TestIndexPut_ManyIndices(PytorchLayerTest):
+    def _prepare_input(self):
+        return (self.input_tensor, self.values)
+
+    def create_model(self, indices, accumulate):
+
+        class aten_index_put_(torch.nn.Module):
+
+            def __init__(self, indices, accumulate):
+                super().__init__()
+                self.indices_first = indices[0]
+                self.indices_second = indices[1]
+                self.accumulate = accumulate
+
+            def forward(self, input_tensor, values):
+                input_tensor.index_put_((self.indices_first, self.indices_second), values, self.accumulate)
+                return input_tensor
+
+        ref_net = None
+
+        return aten_index_put_(indices, accumulate), ref_net, "aten::index_put_"
+
+    @pytest.mark.parametrize('input_data', ({'input_tensor': np.random.randn(3, 3).astype(np.float32),
+                                             'values': np.array(12).astype(np.float32)},
+                                             {'input_tensor': np.random.randn(3, 3, 3).astype(np.float32),
+                                             'values': np.array([10, 11, 12]).astype(np.float32)},))
+    @pytest.mark.parametrize('indices', ((torch.tensor([0], dtype=torch.long),
+                                          torch.tensor([2], dtype=torch.long)),
+                                         (torch.tensor([1, 2], dtype=torch.long),
+                                          torch.tensor([0, 1], dtype=torch.long)),
+                                         (torch.tensor([0, 1], dtype=torch.long),
+                                          torch.tensor([0, 1], dtype=torch.long)),
+                                          (torch.tensor([0], dtype=torch.long),
+                                          torch.tensor([-2], dtype=torch.long)),
+                                         (torch.tensor([-1, -2], dtype=torch.long),
+                                          torch.tensor([0, 1], dtype=torch.long)),
+                                         (torch.tensor([0, -1], dtype=torch.long),
+                                          torch.tensor([0, -1], dtype=torch.long))))
+    @pytest.mark.parametrize('accumulate', (True, False))
+    @pytest.mark.nightly
+    @pytest.mark.precommit
+    def test_index_put_many_indices(self, ie_device, precision, ir_version, input_data, indices, accumulate):
+        self.input_tensor = input_data['input_tensor']
+        self.values = input_data['values']
+        self._test(*self.create_model(indices, accumulate), ie_device, precision, ir_version)