disabling auto-batching when batch<4 (as batch1 kernels are heavily optimized) (#10188)

2022-02-09 12:02:30 +03:00 · 2022-02-09 12:02:30 +03:00 · 320c64de24
commit 320c64de24
parent 04194b292d
1 changed files with 2 additions and 1 deletions
--- a/src/plugins/auto_batch/auto_batch.cpp
+++ b/src/plugins/auto_batch/auto_batch.cpp
@ -746,7 +746,8 @@ InferenceEngine::IExecutableNetworkInternal::Ptr AutoBatchInferencePlugin::LoadN
            requests = static_cast<unsigned int>(PerfHintsConfig::CheckPerformanceHintRequestValue(reqs->second));
        if (requests)
            optBatchSize = std::max(1u, std::min(requests, optimalBatchSize));
-        metaDevice.batchForDevice = optBatchSize;
+        if (optBatchSize > 2)  // batching is usually inefficient for batch<4 (as batch1 kernels are heavily optimized)
+            metaDevice.batchForDevice = optBatchSize;
    }

    const auto perfConfig = fullConfig.find(PluginConfigParams::KEY_PERF_COUNT);