auto-batching functional test (with results check vs ref) and GPU instance for that

2021-11-18 14:51:05 +03:00 · 2021-11-18 14:51:05 +03:00 · 8f1067f4f1
commit 8f1067f4f1
parent 2f062d23c7
3 changed files with 141 additions and 1 deletions
--- a/inference-engine/tests/functional/plugin/gpu/CMakeLists.txt
+++ b/inference-engine/tests/functional/plugin/gpu/CMakeLists.txt
@ -12,7 +12,7 @@ addIeTargetTest(
        INCLUDES
            ${CMAKE_CURRENT_SOURCE_DIR}
        DEPENDENCIES
-            clDNNPlugin
+            clDNNPlugin AutoBatchPlugin
        LINK_LIBRARIES
            funcSharedTests
            OpenCL
--- a/inference-engine/tests/functional/plugin/gpu/shared_tests_instances/auto_batching/auto_batching_tests.cpp
+++ b/inference-engine/tests/functional/plugin/gpu/shared_tests_instances/auto_batching/auto_batching_tests.cpp
@ -0,0 +1,18 @@
 // Copyright (C) 2018-2021 Intel Corporation
 // SPDX-License-Identifier: Apache-2.0
 //
 #include <auto_batching/auto_batching_tests.hpp>
 const std::vector<size_t> num_streams{ 1, 2 };
 const std::vector<bool>   get_vs_set{ true, false };
 const std::vector<size_t> num_requests{ 1, 8, 16, 64 };
 const std::vector<size_t> num_batch{ 1, 4, 8, 16, 32, 64, 128, 256 };
 INSTANTIATE_TEST_SUITE_P(smoke_AutoBatching_GPU, AutoBatching_Test,
        ::testing::Combine(
                ::testing::Values(CommonTestUtils::DEVICE_GPU),
                ::testing::ValuesIn(get_vs_set),
                ::testing::ValuesIn(num_streams),
                ::testing::ValuesIn(num_requests),
                ::testing::ValuesIn(num_batch)),
                AutoBatching_Test::getTestCaseName);
--- a/inference-engine/tests/functional/plugin/shared/include/auto_batching/auto_batching_tests.hpp
+++ b/inference-engine/tests/functional/plugin/shared/include/auto_batching/auto_batching_tests.hpp
@ -0,0 +1,122 @@
 // Copyright (C) 2018-2021 Intel Corporation
 // SPDX-License-Identifier: Apache-2.0
 //
 #include <string>
 #include <utility>
 #include <vector>
 #include <memory>
 #include <gpu/gpu_config.hpp>
 #include <common_test_utils/test_common.hpp>
 #include <functional_test_utils/plugin_cache.hpp>
 #include "ngraph_functions/subgraph_builders.hpp"
 #include "functional_test_utils/blob_utils.hpp"
 using namespace ::testing;
 using namespace InferenceEngine;
 using AutoBatchTwoNetsParams = std::tuple<
        std::string,             // device name
        bool,  // get or set blob
        size_t,  // number of streams
        size_t,  // number of requests
        size_t>; // batch size>
 class AutoBatching_Test : public CommonTestUtils::TestsCommon,
                          public testing::WithParamInterface<AutoBatchTwoNetsParams> {
    void SetUp() override {
        std::tie(device_name, use_get_blob, num_streams, num_requests, num_batch) = this->GetParam();
        fn_ptrs = {ngraph::builder::subgraph::makeSingleConv(), ngraph::builder::subgraph::makeMultiSingleConv()};
    };
 public:
    static std::string getTestCaseName(const testing::TestParamInfo<AutoBatchTwoNetsParams>& obj) {
        size_t streams, requests, batch;
        bool use_get_blob;
        std::string device_name;
        std::tie(device_name, use_get_blob, streams, requests, batch) = obj.param;
        return device_name + std::string(use_get_blob ? "_get_blob" : "_set_blob") + "_batch_size_" + std::to_string(batch) +
               "_num_streams_" + std::to_string(streams) + "_num_req_" + std::to_string(requests);
    }
 protected:
    std::string device_name;
    bool   use_get_blob;
    size_t num_streams;
    size_t num_requests;
    size_t num_batch;
    std::vector<std::shared_ptr<ngraph::Function>> fn_ptrs;
 };
 TEST_P(AutoBatching_Test, compareAutoBatchingToBatch1) {
    std::vector<InferenceEngine::CNNNetwork> nets;
    for (auto &fn_ptr : fn_ptrs) {
        nets.push_back(CNNNetwork(fn_ptr));
    }
    auto ie = InferenceEngine::Core();
    std::vector<std::string> outputs;
    std::vector<InferRequest> irs;
    std::vector<std::vector<uint8_t>> ref;
    std::vector<int> outElementsCount;
    for (size_t i = 0; i < nets.size(); ++i) {
        auto net = nets[i];
        net.getInputsInfo().begin()->second->setLayout(Layout::NCHW);
        net.getInputsInfo().begin()->second->setPrecision(Precision::FP32);
        std::map<std::string, std::string> config;
        if (device_name.find("GPU") != std::string::npos)
            config[CONFIG_KEY(GPU_THROUGHPUT_STREAMS)] = std::to_string(num_streams);
        if (device_name.find("CPU") != std::string::npos)
            config[CONFIG_KEY(CPU_THROUGHPUT_STREAMS)] = std::to_string(num_streams);
        auto exec_net_ref = ie.LoadNetwork(net, std::string("BATCH:") +
                                                   device_name + "(" + std::to_string(num_batch) + ")",
                                                   config);
        for (int j = 0; j < num_requests; j++) {
            outputs.push_back(net.getOutputsInfo().begin()->first);
            auto inf_req = exec_net_ref.CreateInferRequest();
            irs.push_back(inf_req);
            auto blob = FuncTestUtils::createAndFillBlob(net.getInputsInfo().begin()->second->getTensorDesc());
            if (use_get_blob)
                InferenceEngine::blob_copy(blob, inf_req.GetBlob(net.getInputsInfo().begin()->first));
            else
                inf_req.SetBlob(net.getInputsInfo().begin()->first, blob);
            outElementsCount.push_back(
                    std::accumulate(begin(fn_ptrs[i]->get_output_shape(0)), end(fn_ptrs[i]->get_output_shape(0)), 1,
                                    std::multiplies<size_t>()));
            const auto inBlob = inf_req.GetBlob(net.getInputsInfo().begin()->first);
            const auto blobSize = inBlob->byteSize();
            const auto inBlobBuf = inBlob->cbuffer().as<uint8_t *>();
            std::vector<uint8_t> inData(inBlobBuf, inBlobBuf + blobSize);
            auto refOutData = ngraph::helpers::interpreterFunction(fn_ptrs[i], {inData}).front().second;
            ref.push_back(refOutData);
        }
    }
    const int niter = 1;
    for (int i = 0; i < niter; i++) {
        for (auto ir : irs) {
            ir.StartAsync();
        }
        for (auto ir : irs) {
            ir.Wait(InferRequest::RESULT_READY);
        }
    }
    auto thr = FuncTestUtils::GetComparisonThreshold(InferenceEngine::Precision::FP32);
    for (size_t i = 0; i < irs.size(); ++i) {
        const auto &refBuffer = ref[i].data();
        ASSERT_EQ(outElementsCount[i], irs[i].GetBlob(outputs[i])->size());
        FuncTestUtils::compareRawBuffers(irs[i].GetBlob(outputs[i])->buffer().as<float *>(),
                                         reinterpret_cast<const float *>(refBuffer), outElementsCount[i],
                                         outElementsCount[i],
                                         thr);
    }
 }