[GPU] Enable broadcast transition pass (#17172)
parent 3bb0fb61f6
commit d1f1fa2b39
@@ -45,6 +45,7 @@
#include <transformations/common_optimizations/wrap_interpolate_into_transposes.hpp>
#include <transformations/common_optimizations/transpose_sinking.hpp>
#include <transformations/common_optimizations/softmax_fusion.hpp>
#include <transformations/common_optimizations/broadcast_transition.hpp>

#include <transformations/op_conversions/convert_depth_to_space.hpp>
#include <transformations/op_conversions/convert_space_to_depth.hpp>
@@ -196,6 +197,7 @@ void TransformationsPipeline::apply(std::shared_ptr<ov::Model> func) {
    manager.register_pass<ov::pass::SoftmaxFusion>();
    // decompose MVNs that are not supported by the GPU, so they will be marked as precision sensitive in ConvertPrecision
    manager.register_pass<ov::pass::MVN6Decomposition>();
    manager.register_pass<ov::pass::BroadcastTransition>();

    // call ConvertPrecision with keep_precision_sensitive_in_fp32 = true
    manager.register_pass<ov::pass::ConvertPrecision>(fp_convert_precision_map, empty_fuse_map, true);
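For context, below is a minimal standalone sketch, not part of this commit, of how ov::pass::BroadcastTransition can be applied to the Broadcast-into-Add pattern that the new functional test builds. Only the pass name and its header come from the diff above; the helper name make_broadcast_eltwise_model, the main() driver, and the concrete shapes are illustrative assumptions.

// Illustrative sketch only: build the Broadcast -> Add pattern used by the test
// below, then run the BroadcastTransition pass on it in isolation. The GPU plugin
// registers the same pass in its pipeline (see the hunk above), and the test checks
// that after compilation the broadcast ends up after the eltwise.
#include <memory>

#include <openvino/core/model.hpp>
#include <openvino/opsets/opset10.hpp>
#include <openvino/pass/manager.hpp>
#include <transformations/common_optimizations/broadcast_transition.hpp>

std::shared_ptr<ov::Model> make_broadcast_eltwise_model() {
    // Dynamic 4D data input plus a 1D i64 input holding the target broadcast shape,
    // mirroring the test's SetUp().
    auto data = std::make_shared<ov::opset10::Parameter>(ov::element::f16, ov::PartialShape{-1, -1, -1, -1});
    auto target = std::make_shared<ov::opset10::Parameter>(ov::element::i64, ov::PartialShape{4});
    auto scalar = ov::opset10::Constant::create(ov::element::f16, ov::Shape{}, {1.f});
    auto bcast = std::make_shared<ov::opset10::Broadcast>(scalar, target);
    auto add = std::make_shared<ov::opset10::Add>(data, bcast);
    return std::make_shared<ov::Model>(ov::OutputVector{add}, ov::ParameterVector{data, target});
}

int main() {
    auto model = make_broadcast_eltwise_model();
    ov::pass::Manager manager;
    manager.register_pass<ov::pass::BroadcastTransition>();
    manager.run_passes(model);  // expected to move the Broadcast past the Add where legal
    return 0;
}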
@@ -0,0 +1,112 @@
// Copyright (C) 2023 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
//

#include <openvino/opsets/opset10.hpp>
#include <common_test_utils/ov_tensor_utils.hpp>

#include "ngraph_functions/builders.hpp"
#include "ngraph_functions/utils/ngraph_helpers.hpp"
#include "shared_test_classes/base/layer_test_utils.hpp"
#include "shared_test_classes/base/ov_subgraph.hpp"
#include "openvino/pass/serialize.hpp"

using namespace ngraph;
using namespace ov::test;
using namespace InferenceEngine;

namespace GPULayerTestsDefinitions {
using BroadcastEltwiseParams = std::tuple<
    ElementType, // input precision
    InputShape,  // input shape
    ov::Shape    // target broadcast shape
>;

class BroadcastEltwise : virtual public SubgraphBaseTest, public testing::WithParamInterface<BroadcastEltwiseParams> {
public:
    static std::string getTestCaseName(const testing::TestParamInfo<BroadcastEltwiseParams>& obj) {
        ElementType input_precision;
        InputShape input_shape;
        ov::Shape target_shape;
        std::tie(input_precision, input_shape, target_shape) = obj.param;

        std::ostringstream result;
        result << "precision=" << input_precision << "IS=(" << CommonTestUtils::partialShape2str({input_shape.first}) << ")_TS=(";
        for (const auto& item : input_shape.second) {
            result << CommonTestUtils::vec2str(item) << "_";
        }
        result << ")_target_shape=" << CommonTestUtils::vec2str(target_shape);
        return result.str();
    }

protected:
    void SetUp() override {
        ElementType input_precision;
        InputShape input_shape;
        std::tie(input_precision, input_shape, target_shape) = GetParam();
        targetDevice = CommonTestUtils::DEVICE_GPU;

        std::vector<InputShape> input_shapes{input_shape, {{}, {{target_shape.size()}}}};
        init_input_shapes(input_shapes);

        ov::element::TypeVector input_precisions{input_precision, ov::element::i64};
        const auto params = ngraph::builder::makeDynamicParams(input_precisions, inputDynamicShapes);
        const auto bcast_data = ov::opset10::Constant::create(input_precision, {}, {1.f});
        const auto bcast = std::make_shared<ov::opset10::Broadcast>(bcast_data, params[1]);
        const auto add = std::make_shared<ov::opset10::Add>(params[0], bcast);
        function = std::make_shared<ov::Model>(add, params);
    }

    void generate_inputs(const std::vector<ov::Shape>& targetInputStaticShapes) override {
        inputs.clear();
        const auto& funcInputs = function->inputs();
        auto data_tensor = ov::test::utils::create_and_fill_tensor(funcInputs[0].get_element_type(), targetInputStaticShapes[0]);
        inputs.insert({funcInputs[0].get_node_shared_ptr(), data_tensor});

        auto shape_tensor = ov::Tensor{ov::element::i64, targetInputStaticShapes[1]};
        auto data = shape_tensor.data<ov::element_type_traits<ov::element::i64>::value_type>();
        for (size_t i = 0; i < target_shape.size(); i++) {
            data[i] = target_shape[i];
        }
        inputs.insert({funcInputs[1].get_node_shared_ptr(), shape_tensor});
    }

    ov::Shape target_shape;
};

TEST_P(BroadcastEltwise, smoke_CompareWithRefs) {
    run();

    const auto model = compiledModel.get_runtime_model();

    const auto last_node = model->get_result()->get_input_node_shared_ptr(0);
    const auto& last_rt_info = last_node->get_rt_info();
    const auto last_layer_type = last_rt_info.find("layerType")->second.as<std::string>();
    EXPECT_EQ(last_layer_type, "Reorder");

    // Check that the BroadcastTransition transformation was applied and the broadcast is after the eltwise now.
    const auto last_node_input = last_node->get_input_node_shared_ptr(0);
    const auto& last_input_rt_info = last_node_input->get_rt_info();
    const auto last_input_layer_type = last_input_rt_info.find("layerType")->second.as<std::string>();
    EXPECT_EQ(last_input_layer_type, "broadcast");
}

namespace {
const std::vector<InputShape> input_shapes = {
    {{-1, -1, -1, -1}, {{1, 3, 16, 16}}},
    {{-1, -1}, {{16, 16}}},
};

const std::vector<ov::Shape> target_shapes = {
    {1, 3, 16, 1},
    {16, 16},
};

INSTANTIATE_TEST_SUITE_P(smoke_BroadcastEltwise,
                         BroadcastEltwise,
                         ::testing::Combine(::testing::Values(ov::element::f16),
                                            ::testing::ValuesIn(input_shapes),
                                            ::testing::ValuesIn(target_shapes)),
                         BroadcastEltwise::getTestCaseName);
} // namespace
} // namespace GPULayerTestsDefinitions