Removed legacy methods SetBatch and SetBlob (#17984)

* Removed legacy methods SetBatch and SetBlob

* Fixed GPU plugin build

* Remove DYN_BATCH_LIMIT from tests

* Revert some changes in GPU plugin
Ilya Churaev 2023-06-12 22:54:23 +04:00 committed by GitHub
parent df44f92a97
commit 0743e9bfb5
47 changed files with 18 additions and 708 deletions

View File

@ -67,8 +67,6 @@ The application prints all available devices with their supported metrics and de
[ INFO ] CPU_THREADS_NUM : 0
[ INFO ] CPU_THROUGHPUT_STREAMS : 1
[ INFO ] DUMP_EXEC_GRAPH_AS_DOT : ""
[ INFO ] DYN_BATCH_ENABLED : NO
[ INFO ] DYN_BATCH_LIMIT : 0
[ INFO ] ENFORCE_BF16 : NO
[ INFO ] EXCLUSIVE_ASYNC_REQUESTS : NO
[ INFO ] PERFORMANCE_HINT : ""

View File

@ -62,8 +62,6 @@ For example:
[ INFO ] CPU_THREADS_NUM: 0
[ INFO ] CPU_THROUGHPUT_STREAMS: 1
[ INFO ] DUMP_EXEC_GRAPH_AS_DOT:
[ INFO ] DYN_BATCH_ENABLED: NO
[ INFO ] DYN_BATCH_LIMIT: 0
[ INFO ] ENFORCE_BF16: NO
[ INFO ] EXCLUSIVE_ASYNC_REQUESTS: NO
[ INFO ] PERFORMANCE_HINT:
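
The two listings above are sample documentation output that simply loses its DYN_BATCH_ENABLED and DYN_BATCH_LIMIT rows. For orientation, a minimal sketch of how such a listing is typically produced with the legacy InferenceEngine::Core API follows; the device name, the "[ INFO ]" prefix, and the assumption that the queried values are string-convertible are illustrative and not taken from the samples.

#include <iostream>
#include <string>
#include <vector>

#include <ie_core.hpp>
#include <ie_plugin_config.hpp>

int main() {
    InferenceEngine::Core ie;
    const std::string device = "CPU";  // placeholder target device

    // SUPPORTED_CONFIG_KEYS is a standard Inference Engine metric; after this commit
    // the returned list no longer contains DYN_BATCH_ENABLED or DYN_BATCH_LIMIT.
    auto keys = ie.GetMetric(device, METRIC_KEY(SUPPORTED_CONFIG_KEYS))
                    .as<std::vector<std::string>>();
    for (const auto& key : keys) {
        // GetConfig returns an InferenceEngine::Parameter; most legacy keys hold strings.
        InferenceEngine::Parameter value = ie.GetConfig(device, key);
        std::cout << "[ INFO ] " << key << " : " << value.as<std::string>() << std::endl;
    }
    return 0;
}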

View File

@ -240,11 +240,6 @@ public:
_syncRequest->SetBlob(name, data);
}
void SetBlob(const std::string& name, const Blob::Ptr& data, const PreProcessInfo& info) override {
CheckState();
_syncRequest->SetBlob(name, data, info);
}
void SetBlobs(const std::string& name, const std::vector<Blob::Ptr>& blobs) override {
CheckState();
_syncRequest->SetBlobs(name, blobs);
@ -264,13 +259,6 @@ public:
return _syncRequest->GetPreProcess(name);
}
OPENVINO_SUPPRESS_DEPRECATED_START
void SetBatch(int batch) override {
CheckState();
_syncRequest->SetBatch(batch);
};
OPENVINO_SUPPRESS_DEPRECATED_END
void SetCallback(Callback callback) override {
CheckState();
_callback = std::move(callback);

View File

@ -131,15 +131,6 @@ public:
*/
virtual BatchedBlob::Ptr GetBlobs(const std::string& name);
/**
* @brief Sets pre-process for input data
* @param name Name of input blob.
* @param data - a reference to input or output blob. The type of Blob must correspond to the network input
* precision and size.
* @param info Preprocess info for blob.
*/
virtual void SetBlob(const std::string& name, const Blob::Ptr& data, const PreProcessInfo& info);
/**
* @brief Gets pre-process for input data
* @param name Name of input blob.
@ -147,14 +138,6 @@ public:
*/
virtual const PreProcessInfo& GetPreProcess(const std::string& name) const;
/**
* @brief Sets new batch size when dynamic batching is enabled in executable network that created this request.
* @deprecated
* @param batch - new batch size to be used by all the following inference calls for this request.
*/
INFERENCE_ENGINE_DEPRECATED("This method is deprecated and will be removed in 2023.1 release")
virtual void SetBatch(int batch);
/**
* @brief Queries memory states.
* @return Returns memory states
@ -347,7 +330,6 @@ protected:
std::vector<std::shared_ptr<const ov::Node>> _results; //!< A vector of function outputs
std::map<std::string, PreProcessDataPtr> _preProcData; //!< A map of pre-process data per input
std::map<std::string, BatchedBlob::Ptr> _batched_inputs; //!< A map of user passed blobs for network inputs
int m_curBatch = -1; //!< Current batch value used in dynamic batching
/**
* @brief A shared pointer to IInferRequestInternal

View File

@ -118,17 +118,6 @@ public:
*/
Blob::Ptr GetBlob(const std::string& name);
/**
* @deprecated This method will be removed in 2023.1 release
* @brief Sets blob with a pre-process information
* @note Returns an error in case if data blob is output
* @param name Name of input blob.
* @param data A reference to input. The type of Blob must correspond to the network input precision and size.
* @param info Preprocess info for blob.
*/
INFERENCE_ENGINE_DEPRECATED("This method is deprecated and will be removed in 2023.1 release")
void SetBlob(const std::string& name, const Blob::Ptr& data, const PreProcessInfo& info);
/**
* @brief Gets pre-process for input data
* @param name Name of input blob.
@ -175,15 +164,6 @@ public:
*/
void SetOutput(const BlobMap& results);
/**
* @brief Sets new batch size when dynamic batching is enabled in executable network that created this request.
* @deprecated
*
* @param batch new batch size to be used by all the following inference calls for this request.
*/
INFERENCE_ENGINE_DEPRECATED("This method is deprecated and will be removed in 2023.1 release")
void SetBatch(const int batch);
/**
* @brief Start inference of specified input(s) in asynchronous mode
*
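
The header above removes two public entry points from InferenceEngine::InferRequest: the SetBlob overload that carried per-blob PreProcessInfo, and the deprecated SetBatch. A hypothetical user-side snippet of the kind that stops compiling after this commit is sketched below; the blob name "data" and the chosen resize algorithm are placeholders.

#include <ie_core.hpp>

void legacy_preprocess_and_batch(InferenceEngine::InferRequest& request,
                                 const InferenceEngine::Blob::Ptr& input) {
    // Removed overload: attach a blob together with per-blob pre-processing info.
    InferenceEngine::PreProcessInfo info;
    info.setResizeAlgorithm(InferenceEngine::RESIZE_BILINEAR);
    request.SetBlob("data", input, info);  // no longer declared after this change

    // Removed method: shrink the effective batch for the following Infer() calls.
    request.SetBatch(4);                   // no longer declared after this change

    request.Infer();
}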

View File

@ -85,21 +85,6 @@ public:
*/
virtual StatusCode GetBlob(const char* name, Blob::Ptr& data, ResponseDesc* resp) noexcept = 0;
/**
* @deprecated This method will be removed in 2023.1 release
* @brief Sets pre-process for input data
* @param name Name of input blob.
* @param data Reference to input or output blob. The type of Blob must match the network input precision and size.
* @param info Preprocess info for blob.
* @param resp Optional: pointer to an already allocated object to contain information in case of failure
* @return Status code of the operation: OK (0) for success
*/
INFERENCE_ENGINE_DEPRECATED("This method is deprecated and will be removed in 2023.1 release")
virtual StatusCode SetBlob(const char* name,
const Blob::Ptr& data,
const PreProcessInfo& info,
ResponseDesc* resp) noexcept = 0;
/**
* @brief Gets pre-process for input data
* @param name Name of input blob.
@ -200,18 +185,6 @@ public:
*/
virtual StatusCode SetUserData(void* data, ResponseDesc* resp) noexcept = 0;
/**
* @brief Sets new batch size when dynamic batching is enabled in executable network that created this request.
*
* @deprecated
* @param batch_size new batch size to be used by all the following inference calls for this request.
* @param resp Optional: a pointer to an already allocated object to contain extra information of a failure (if
* occurred)
* @return Enumeration of the resulted action: InferenceEngine::OK (0) for success
*/
INFERENCE_ENGINE_DEPRECATED("This method is deprecated and will be removed in 2023.1 release")
virtual InferenceEngine::StatusCode SetBatch(int batch_size, ResponseDesc* resp) noexcept = 0;
protected:
virtual ~IInferRequest() = default;
};

View File

@ -405,30 +405,6 @@ DECLARE_CONFIG_VALUE(CPU_THROUGHPUT_AUTO);
INFERENCE_ENGINE_1_0_DEPRECATED
DECLARE_CONFIG_KEY(PERF_COUNT);
/**
* @brief The key defines dynamic limit of batch processing.
* @deprecated
*
* Specified value is applied to all following Infer() calls. Inference Engine processes
* min(batch_limit, original_batch_size) first pictures from input blob. For example, if input
* blob has sizes 32x3x224x224 after applying plugin.SetConfig({KEY_DYN_BATCH_LIMIT, 10})
* Inference Engine primitives processes only beginner subblobs with size 10x3x224x224.
* This value can be changed before any Infer() call to specify a new batch limit.
*
* The paired parameter value should be convertible to integer number. Acceptable values:
* -1 - Do not limit batch processing
* >0 - Direct value of limit. Batch size to process is min(new batch_limit, original_batch)
*/
INFERENCE_ENGINE_DEPRECATED("This config is deprecated and will be removed in 2023.1 release")
DECLARE_CONFIG_KEY(DYN_BATCH_LIMIT);
/**
* @brief The key checks whether dynamic batch is enabled.
* @deprecated
*/
INFERENCE_ENGINE_DEPRECATED("This config is deprecated and will be removed in 2023.1 release")
DECLARE_CONFIG_KEY(DYN_BATCH_ENABLED);
/**
* @brief This key directs the plugin to load a configuration file.
*
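
The two config keys deleted here are the switch and the cap for the legacy dynamic-batch flow that the rest of this commit dismantles: enable the feature at LoadNetwork time, then shrink the batch per request with SetBatch, never above the compiled (maximal) batch size. A condensed, hypothetical sketch of that flow, mirroring what the deleted DynamicBatchTest further below used to do (model path, device, and batch sizes are placeholders):

#include <map>
#include <string>

#include <ie_core.hpp>
#include <ie_plugin_config.hpp>

void run_with_legacy_dynamic_batch(const std::string& model_xml) {
    InferenceEngine::Core ie;
    InferenceEngine::CNNNetwork network = ie.ReadNetwork(model_xml);
    network.setBatchSize(32);  // maximal batch the compiled network must support

    // DYN_BATCH_ENABLED turned the feature on; plugins also accepted
    // DYN_BATCH_LIMIT to cap the processed batch to min(limit, original batch).
    std::map<std::string, std::string> config = {
        {CONFIG_KEY(DYN_BATCH_ENABLED), CONFIG_VALUE(YES)}};

    auto exec_network = ie.LoadNetwork(network, "CPU", config);
    auto request = exec_network.CreateInferRequest();

    // Removed along with the keys: only the first 10 of the 32 input "pictures"
    // are processed by the following call.
    request.SetBatch(10);
    request.Infer();
}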

View File

@ -134,10 +134,6 @@ public:
TO_STATUS(_impl->SetBlob(name, data));
}
StatusCode SetBlob(const char* name, const Blob::Ptr& data, const PreProcessInfo& info, ResponseDesc* resp) noexcept override {
TO_STATUS(_impl->SetBlob(name, data, info));
}
StatusCode GetBlob(const char* name, Blob::Ptr& data, ResponseDesc* resp) noexcept override {
TO_STATUS(data = _impl->GetBlob(name));
}
@ -181,10 +177,6 @@ public:
StatusCode SetUserData(void* data, ResponseDesc* resp) noexcept override {
TO_STATUS(_impl->SetUserData(data));
}
StatusCode SetBatch(int batch_size, ResponseDesc* resp) noexcept override {
TO_STATUS(_impl->SetBatch(batch_size));
}
};
IE_SUPPRESS_DEPRECATED_END

View File

@ -58,10 +58,6 @@ Blob::Ptr InferRequest::GetBlob(const std::string& name) {
return blobPtr;
}
void InferRequest::SetBlob(const std::string& name, const Blob::Ptr& data, const PreProcessInfo& info) {
INFER_REQ_CALL_STATEMENT(_impl->SetBlob(name, data, info);)
}
const PreProcessInfo& InferRequest::GetPreProcess(const std::string& name) const {
INFER_REQ_CALL_STATEMENT(return _impl->GetPreProcess(name);)
}
@ -86,10 +82,6 @@ void InferRequest::SetOutput(const BlobMap& results) {
INFER_REQ_CALL_STATEMENT(for (auto&& result : results) { _impl->SetBlob(result.first, result.second); })
}
void InferRequest::SetBatch(const int batch) {
INFER_REQ_CALL_STATEMENT(_impl->SetBatch(batch);)
}
void InferRequest::StartAsync() {
INFER_REQ_CALL_STATEMENT(_impl->StartAsync();)
}

View File

@ -407,18 +407,6 @@ BatchedBlob::Ptr IInferRequestInternal::GetBlobs(const std::string& name) {
return nullptr;
}
void IInferRequestInternal::SetBlob(const std::string& name, const Blob::Ptr& data, const PreProcessInfo& info) {
InputInfo::Ptr foundInput;
DataPtr foundOutput;
if (findInputAndOutputBlobByName(name, foundInput, foundOutput)) {
foundInput->getPreProcess() = copyPreProcess(info);
} else {
IE_THROW() << "Pre-process can't be set to output blob";
}
SetBlob(name, data);
}
const PreProcessInfo& IInferRequestInternal::GetPreProcess(const std::string& name) const {
InputInfo::Ptr foundInput;
DataPtr foundOutput;
@ -429,10 +417,6 @@ const PreProcessInfo& IInferRequestInternal::GetPreProcess(const std::string& na
}
}
void IInferRequestInternal::SetBatch(int batch) {
IE_THROW(NotImplemented);
}
std::vector<std::shared_ptr<IVariableStateInternal>> IInferRequestInternal::QueryState() {
IE_THROW(NotImplemented);
}
@ -460,7 +444,7 @@ void IInferRequestInternal::execDataPreprocessing(InferenceEngine::BlobMap& prep
// using preconfigured resize algorithm.
auto it = _preProcData.find(input.first);
if (it != _preProcData.end()) {
it->second->execute(input.second, _networkInputs[input.first]->getPreProcess(), serial, m_curBatch);
it->second->execute(input.second, _networkInputs[input.first]->getPreProcess(), serial, -1);
}
}
}

View File

@ -541,20 +541,10 @@ public:
return std::make_shared<InferenceEngine::BatchedBlob>(blobs);
}
void SetBlob(const std::string& name,
const InferenceEngine::Blob::Ptr& data,
const InferenceEngine::PreProcessInfo& info) override {
OPENVINO_NOT_IMPLEMENTED;
}
const InferenceEngine::PreProcessInfo& GetPreProcess(const std::string& name) const override {
OPENVINO_NOT_IMPLEMENTED;
}
void SetBatch(int batch) override {
OPENVINO_NOT_IMPLEMENTED;
}
std::vector<std::shared_ptr<InferenceEngine::IVariableStateInternal>> QueryState() override {
auto res = m_request->query_state();
std::vector<std::shared_ptr<InferenceEngine::IVariableStateInternal>> ret;

View File

@ -23,13 +23,6 @@ TEST(InferRequestCPPTests, throwsOnUninitializedGetBlob) {
ASSERT_THROW(req.GetBlob({}), InferenceEngine::NotAllocated);
}
TEST(InferRequestCPPTests, throwsOnUninitializedSetBlobPreproc) {
InferRequest req;
IE_SUPPRESS_DEPRECATED_START
ASSERT_THROW(req.SetBlob({}, {}, {}), InferenceEngine::NotAllocated);
IE_SUPPRESS_DEPRECATED_END
}
TEST(InferRequestCPPTests, throwsOnUninitializedGetPreProcess) {
InferRequest req;
ASSERT_THROW(req.GetPreProcess({}), InferenceEngine::NotAllocated);
@ -55,13 +48,6 @@ TEST(InferRequestCPPTests, throwsOnUninitializedSetOutput) {
ASSERT_THROW(req.SetOutput({{}}), InferenceEngine::NotAllocated);
}
TEST(InferRequestCPPTests, throwsOnUninitializedSetBatch) {
InferRequest req;
IE_SUPPRESS_DEPRECATED_START
ASSERT_THROW(req.SetBatch({}), InferenceEngine::NotAllocated);
IE_SUPPRESS_DEPRECATED_END
}
TEST(InferRequestCPPTests, throwsOnUninitializedStartAsync) {
InferRequest req;
ASSERT_THROW(req.StartAsync(), InferenceEngine::NotAllocated);

View File

@ -110,15 +110,6 @@ void MultiDeviceInferRequest::SetBlob(const std::string& name, const InferenceEn
IInferRequestInternal::SetBlob(name, blob);
}
IE_SUPPRESS_DEPRECATED_START
void MultiDeviceInferRequest::SetBlob(const std::string& name, const Blob::Ptr& blob, const PreProcessInfo& info) {
if (_sharedRequest)
_sharedRequest->SetBlob(name, blob, info);
else
IInferRequestInternal::SetBlob(name, blob, info);
}
IE_SUPPRESS_DEPRECATED_END
InferenceEngine::Blob::Ptr MultiDeviceInferRequest::GetBlob(const std::string& name) {
if (_sharedRequest)
return _sharedRequest->GetBlob(name);

View File

@ -39,13 +39,6 @@ public:
InferenceEngine::RemoteContext::Ptr ctx = nullptr);
std::map<std::string, InferenceEngine::InferenceEngineProfileInfo> GetPerformanceCounts() const override;
void SetBlob(const std::string& name, const InferenceEngine::Blob::Ptr& blob) override;
/**
* @deprecated This method will be removed in 2024.1 release
* @brief Sets blob with a pre-process information
*/
void SetBlob(const std::string& name,
const InferenceEngine::Blob::Ptr& blob,
const InferenceEngine::PreProcessInfo& info) override;
InferenceEngine::Blob::Ptr GetBlob(const std::string& name) override;
std::vector<std::shared_ptr<InferenceEngine::IVariableStateInternal>> QueryState() override;
// Multi-Device impl specific: sets the data (blobs from the device-less requests to the specific device request)

View File

@ -102,14 +102,6 @@ InferenceEngine::Blob::Ptr HeteroInferRequest::GetBlob(const std::string& name)
return itRequest->second->GetBlob(name);
}
void HeteroInferRequest::SetBlob(const std::string& name, const Blob::Ptr& blob, const PreProcessInfo& info) {
auto itRequest = _subRequestFromBlobName.find(name);
if (itRequest == _subRequestFromBlobName.end()) {
IE_THROW() << "There is no infer requests binded to blob with name: " << name;
}
itRequest->second->SetBlob(name, blob, info);
}
const InferenceEngine::PreProcessInfo& HeteroInferRequest::GetPreProcess(const std::string& name) const {
auto itRequest = _subRequestFromBlobName.find(name);
if (itRequest == _subRequestFromBlobName.end()) {

View File

@ -44,10 +44,6 @@ public:
InferenceEngine::Blob::Ptr GetBlob(const std::string& name) override;
void SetBlob(const std::string& name,
const InferenceEngine::Blob::Ptr& blob,
const InferenceEngine::PreProcessInfo& info) override;
const InferenceEngine::PreProcessInfo& GetPreProcess(const std::string& name) const override;
std::vector<std::shared_ptr<InferenceEngine::IVariableStateInternal>> QueryState() override;

View File

@ -118,17 +118,6 @@ void Config::readProperties(const std::map<std::string, std::string> &prop) {
IE_THROW() << "Wrong value " << val << "for property key " << ov::hint::enable_hyper_threading.name()
<< ". Expected only true/false." << std::endl;
}
} else if (key == PluginConfigParams::KEY_DYN_BATCH_LIMIT) {
int val_i = -1;
try {
val_i = std::stoi(val);
} catch (const std::exception&) {
IE_THROW() << "Wrong value for property key " << PluginConfigParams::KEY_DYN_BATCH_LIMIT
<< ". Expected only integer numbers";
}
// zero and any negative value will be treated
// as default batch size
batchLimit = std::max(val_i, 0);
} else if (key == CPUConfigParams::KEY_CPU_SPARSE_WEIGHTS_DECOMPRESSION_RATE) {
float val_f = 0.0f;
try {
@ -155,14 +144,6 @@ void Config::readProperties(const std::map<std::string, std::string> &prop) {
else
IE_THROW() << "Wrong value for property key " << PluginConfigParams::KEY_EXCLUSIVE_ASYNC_REQUESTS
<< ". Expected only YES/NO";
} else if (key.compare(PluginConfigParams::KEY_DYN_BATCH_ENABLED) == 0) {
if (val.compare(PluginConfigParams::YES) == 0)
enableDynamicBatch = true;
else if (val.compare(PluginConfigParams::NO) == 0)
enableDynamicBatch = false;
else
IE_THROW() << "Wrong value for property key " << PluginConfigParams::KEY_DYN_BATCH_ENABLED
<< ". Expected only YES/NO";
IE_SUPPRESS_DEPRECATED_START
} else if (key.compare(PluginConfigParams::KEY_DUMP_EXEC_GRAPH_AS_DOT) == 0) {
IE_SUPPRESS_DEPRECATED_END
@ -307,14 +288,6 @@ void Config::updateProperties() {
_config.insert({ PluginConfigParams::KEY_EXCLUSIVE_ASYNC_REQUESTS, PluginConfigParams::YES });
else
_config.insert({ PluginConfigParams::KEY_EXCLUSIVE_ASYNC_REQUESTS, PluginConfigParams::NO });
IE_SUPPRESS_DEPRECATED_START
if (enableDynamicBatch == true)
_config.insert({ PluginConfigParams::KEY_DYN_BATCH_ENABLED, PluginConfigParams::YES });
else
_config.insert({ PluginConfigParams::KEY_DYN_BATCH_ENABLED, PluginConfigParams::NO });
_config.insert({ PluginConfigParams::KEY_DYN_BATCH_LIMIT, std::to_string(batchLimit) });
IE_SUPPRESS_DEPRECATED_END
_config.insert({ PluginConfigParams::KEY_CPU_THROUGHPUT_STREAMS, std::to_string(streamExecutorConfig._streams) });

View File

@ -42,11 +42,9 @@ struct Config {
bool collectPerfCounters = false;
bool exclusiveAsyncRequests = false;
bool enableDynamicBatch = false;
SnippetsMode snippetsMode = SnippetsMode::Enable;
std::string dumpToDot = {};
std::string device_id = {};
int batchLimit = 0;
float fcSparseWeiDecompressionRate = 1.0f;
#if defined(OPENVINO_ARCH_X86_64)
size_t rtCacheCapacity = 5000ul;

View File

@ -82,13 +82,6 @@ ExecNetwork::ExecNetwork(const InferenceEngine::CNNNetwork &network,
_cfg.isNewApi = !isLegacyAPI();
_mutex = std::make_shared<std::mutex>();
if (_cfg.batchLimit > 1) {
// check topology for applicability
if (!CanProcessDynBatch(_network)) {
IE_THROW() << "Graph::CreateGraph: such topology cannot be compiled for dynamic batch!";
}
}
if (cfg.exclusiveAsyncRequests) {
// special case when all InferRequests are muxed into a single queue
_taskExecutor = _plugin->executorManager()->getExecutor("CPU");
@ -378,53 +371,6 @@ InferenceEngine::Parameter ExecNetwork::GetMetric(const std::string &name) const
return GetMetricLegacy(name, graph);
}
bool ExecNetwork::CanProcessDynBatch(const InferenceEngine::CNNNetwork &network) const {
InputsDataMap inputs = network.getInputsInfo();
if (inputs.empty())
return false;
auto function = network.getFunction();
if (function == nullptr) {
IE_THROW() << "CPU plug-in doesn't support not ngraph-based model!";
}
auto ops = function->get_ordered_ops();
for (const auto& op : ops) {
auto type = TypeFromName(op->get_type_name());
if (type == Type::Tile) {
const auto repeatsNode = std::dynamic_pointer_cast<const ngraph::opset1::Constant>(op->get_input_node_shared_ptr(1));
if (!repeatsNode)
return false;
const auto tile = std::dynamic_pointer_cast<const ngraph::opset1::Tile>(op);
if (tile && repeatsNode->cast_vector<int64_t>()[0] == 1)
continue;
}
if (type == Type::Reshape) {
if (op->get_input_shape(0)[0] == op->get_output_shape(0)[0])
continue;
}
if (type != Type::Input &&
type != Type::Output &&
type != Type::Convolution &&
type != Type::Deconvolution &&
type != Type::Lrn &&
type != Type::Pooling &&
type != Type::FullyConnected &&
type != Type::MatMul &&
type != Type::Softmax &&
type != Type::Split &&
type != Type::Concatenation &&
type != Type::Eltwise) {
return false;
}
}
return true;
}
void ExecNetwork::Export(std::ostream& modelStream) {
CNNNetworkSerializer serializer(modelStream, extensionManager);
serializer <<_network;

View File

@ -76,8 +76,6 @@ protected:
*/
GraphGuard::Lock GetGraph() const;
bool CanProcessDynBatch(const InferenceEngine::CNNNetwork &network) const;
bool isLegacyAPI() const;
InferenceEngine::Parameter GetConfigLegacy(const std::string &name) const;

View File

@ -983,14 +983,6 @@ void Graph::PullOutputData(BlobMap &out) {
outBloMem.SetData(intr_blob, false);
} else {
size_t size_to_copy = intr_blob.GetDescWithType<BlockedMemoryDesc>()->getPaddedElementsCount();
// used only for backward compatibility with the legacy API
if (getConfig().batchLimit && dynBatch > 0) {
if (node->isDynamicNode() && !getConfig().isNewApi) {
IE_THROW(NotImplemented) << "[DS] not implemented dynamic batch for node with dynamic shape";
}
size_to_copy = std::accumulate(outDims.begin() + 1, outDims.end(), (size_t)1, std::multiplies<size_t>()) * static_cast<size_t>(dynBatch);
}
cpu_convert(intr_blob_ptr, ext_blob_ptr, srcPrec, dstPrec, size_to_copy);
}

View File

@ -190,17 +190,6 @@ public:
return graphHasDynamicInput;
}
/**
* @brief This call updates the dynamic batch value
*
* @note It is used for backward compatibility with legacy API only.
* @param newDynBatch
* new dynamic batch value
*/
void setDynBatch(int newDynBatch) {
dynBatch = newDynBatch;
}
protected:
void VisitNode(NodePtr node, std::vector<NodePtr>& sortedNodes);
@ -266,10 +255,6 @@ private:
GraphContext::CPtr context;
// this field stores the dynamic batch value to provide backward compatibility
// with the legacy API dyn batch behaviour
int dynBatch = -1;
void EnforceBF16();
};

View File

@ -354,19 +354,6 @@ void LegacyInferRequest::initBlobs() {
}
}
void LegacyInferRequest::SetBatch(int new_batch) {
if (!graph->getConfig().enableDynamicBatch)
IE_THROW() << "Dynamic batch is not enabled.";
if (new_batch < 1 || new_batch > graph->getConfig().batchLimit) {
IE_THROW() << "Invalid dynamic batch size " << new_batch <<
" for this request.";
}
m_curBatch = new_batch;
graph->setDynBatch(m_curBatch);
}
void LegacyInferRequest::changeDefaultPtr() {
// renew external pointers before infer
const auto &inMap = graph->inputNodesMap;
@ -448,7 +435,7 @@ void LegacyInferRequest::SetBlob(const std::string& name, const InferenceEngine:
auto pBlobDesc = MemoryDescUtils::interpretAsBlobDesc(graph->getInputNodeByName(name)->getChildEdgesAtPort(0)[0]->getMemory());
if (data->getTensorDesc() == pBlobDesc &&
graph->_normalizePreprocMap.find(name) == graph->_normalizePreprocMap.end() && !graph->getConfig().batchLimit) {
graph->_normalizePreprocMap.find(name) == graph->_normalizePreprocMap.end()) {
externalPtr[name] = data->buffer();
} else if (externalPtr.find(name) != externalPtr.end()) {
externalPtr.erase(name);
@ -481,8 +468,7 @@ void LegacyInferRequest::SetBlob(const std::string& name, const InferenceEngine:
}
auto pBlobDesc = MemoryDescUtils::interpretAsBlobDesc(graph->getOutputNodeByName(name)->getParentEdgesAtPort(0)[0]->getMemory());
if (data->getTensorDesc() == pBlobDesc &&
!graph->getConfig().batchLimit) {
if (data->getTensorDesc() == pBlobDesc) {
externalPtr[name] = data->buffer();
} else if (externalPtr.find(name) != externalPtr.end()) {
externalPtr.erase(name);
@ -527,7 +513,7 @@ InferenceEngine::Blob::Ptr LegacyInferRequest::GetBlob(const std::string& name)
_inputs[name] = make_blob_with_precision(desc);
_inputs[name]->allocate();
if (pBlob->getTensorDesc() == desc &&
graph->_normalizePreprocMap.find(name) == graph->_normalizePreprocMap.end() && !graph->getConfig().batchLimit) {
graph->_normalizePreprocMap.find(name) == graph->_normalizePreprocMap.end()) {
externalPtr[name] = _inputs[name]->buffer();
}
}
@ -589,7 +575,7 @@ InferenceEngine::Blob::Ptr LegacyInferRequest::GetBlob(const std::string& name)
}
_outputs[name] = data;
if (!externalPtr.count(name) && data->getTensorDesc() == pBlobDesc && !graph->getConfig().batchLimit) {
if (!externalPtr.count(name) && data->getTensorDesc() == pBlobDesc) {
externalPtr[name] = data->buffer();
}
}
@ -706,7 +692,7 @@ void InferRequest::SetBlob(const std::string& name, const InferenceEngine::Blob:
blobDesc.getDims());
}
if (actualDesc->isCompatible(MemoryDescUtils::convertToCpuBlockedMemoryDesc(blobDesc)) &&
graph->_normalizePreprocMap.find(name) == graph->_normalizePreprocMap.end() && !graph->getConfig().batchLimit) {
graph->_normalizePreprocMap.find(name) == graph->_normalizePreprocMap.end()) {
externalPtr[name] = data->buffer();
} else if (externalPtr.find(name) != externalPtr.end()) {
externalPtr.erase(name);
@ -738,7 +724,7 @@ void InferRequest::SetBlob(const std::string& name, const InferenceEngine::Blob:
}
const auto &desc = graph->getOutputNodeByName(name)->getParentEdgesAtPort(0)[0]->getMemory().getDesc();
if (!isDynamic && blobDesc == MemoryDescUtils::convertToTensorDesc(desc) && !graph->getConfig().batchLimit) {
if (!isDynamic && blobDesc == MemoryDescUtils::convertToTensorDesc(desc)) {
externalPtr[name] = data->buffer();
} else if (externalPtr.find(name) != externalPtr.end()) {
externalPtr.erase(name);
@ -786,7 +772,7 @@ InferenceEngine::Blob::Ptr InferRequest::GetBlob(const std::string& name) {
if (!isDynamic &&
desc == MemoryDescUtils::convertToTensorDesc(graph->getInputNodeByName(name)->getChildEdgesAtPort(0)[0]->getMemory().getDesc()) &&
graph->_normalizePreprocMap.find(name) == graph->_normalizePreprocMap.end() && !graph->getConfig().batchLimit) {
graph->_normalizePreprocMap.find(name) == graph->_normalizePreprocMap.end()) {
externalPtr[name] = _inputs[name]->buffer();
}
} else {
@ -845,8 +831,7 @@ InferenceEngine::Blob::Ptr InferRequest::GetBlob(const std::string& name) {
_outputs[name] = data;
if (!isDynamic && !externalPtr.count(name) &&
data->getTensorDesc() == MemoryDescUtils::convertToTensorDesc(output->second->getParentEdgesAtPort(0)[0]->getMemory().getDesc()) &&
!graph->getConfig().batchLimit) {
data->getTensorDesc() == MemoryDescUtils::convertToTensorDesc(output->second->getParentEdgesAtPort(0)[0]->getMemory().getDesc())) {
externalPtr[name] = data->buffer();
}
} else {

View File

@ -84,7 +84,6 @@ public:
private:
void PushInputData() override;
void initBlobs() override;
void SetBatch(int batch = -1) override;
void changeDefaultPtr() override;
};

View File

@ -418,13 +418,6 @@ static bool shouldEnforceBF16(const std::map<std::string, std::string>& modelCon
}
static Config::SnippetsMode getSnippetsMode(const std::map<std::string, std::string>& modelConfig, const Config& engineConfig) {
const auto& dynamicBatchProp = modelConfig.find(InferenceEngine::PluginConfigParams::KEY_DYN_BATCH_ENABLED);
const bool enableDynamicBatch = (dynamicBatchProp != modelConfig.end() && dynamicBatchProp->second == PluginConfigParams::YES)
|| engineConfig.enableDynamicBatch;
if (enableDynamicBatch) // dynamic batch is not supported
return Config::SnippetsMode::Disable;
const auto& snippetsMode = modelConfig.find(InferenceEngine::PluginConfigInternalParams::KEY_SNIPPETS_MODE);
if (snippetsMode == modelConfig.end()) // not set explicitly
return Config::SnippetsMode::Enable; // enable by default
@ -501,10 +494,6 @@ Engine::LoadExeNetworkImpl(const InferenceEngine::CNNNetwork &network, const std
Config conf = engConfig;
conf.readProperties(config);
if (conf.enableDynamicBatch) {
conf.batchLimit = static_cast<int>(network.getBatchSize());
}
if (is_cpu_map_available()) {
GetPerformanceStreams(conf, nGraphFunc);
}
@ -744,10 +733,6 @@ QueryNetworkResult Engine::QueryNetwork(const CNNNetwork& network, const std::ma
Config conf = engConfig;
conf.readProperties(config);
if (conf.enableDynamicBatch) {
conf.batchLimit = static_cast<int>(network.getBatchSize());
}
const auto& lptProp = config.find(InferenceEngine::PluginConfigInternalParams::KEY_LP_TRANSFORMS_MODE);
const bool enableLPT = (lptProp != config.end() && lptProp->second == PluginConfigParams::YES) /* enabled in the orig_config*/
|| Config::LPTransformsMode::On == engConfig.lpTransformsMode /* or already enabled */;
@ -816,9 +801,6 @@ InferenceEngine::IExecutableNetworkInternal::Ptr Engine::ImportNetwork(std::istr
}
}
if (conf.enableDynamicBatch) {
conf.batchLimit = static_cast<int>(cnnnetwork.getBatchSize());
}
if (is_cpu_map_available()) {
get_num_streams(conf.streamExecutorConfig._streams, function, conf);
}

View File

@ -20,8 +20,7 @@ namespace {
{{InferenceEngine::PluginConfigParams::KEY_CPU_THROUGHPUT_STREAMS, InferenceEngine::PluginConfigParams::CPU_THROUGHPUT_NUMA}},
{{InferenceEngine::PluginConfigParams::KEY_CPU_THROUGHPUT_STREAMS, "8"}},
{{InferenceEngine::PluginConfigParams::KEY_CPU_BIND_THREAD, InferenceEngine::PluginConfigParams::NO}},
{{InferenceEngine::PluginConfigParams::KEY_CPU_BIND_THREAD, InferenceEngine::PluginConfigParams::YES}},
{{InferenceEngine::PluginConfigParams::KEY_DYN_BATCH_LIMIT, "10"}},
{{InferenceEngine::PluginConfigParams::KEY_CPU_BIND_THREAD, InferenceEngine::PluginConfigParams::YES}}
};
const std::vector<std::map<std::string, std::string>> MultiInConfigs = {
@ -36,9 +35,7 @@ namespace {
{{InferenceEngine::MultiDeviceConfigParams::KEY_MULTI_DEVICE_PRIORITIES , CommonTestUtils::DEVICE_CPU},
{InferenceEngine::PluginConfigParams::KEY_CPU_BIND_THREAD, InferenceEngine::PluginConfigParams::NO}},
{{InferenceEngine::MultiDeviceConfigParams::KEY_MULTI_DEVICE_PRIORITIES , CommonTestUtils::DEVICE_CPU},
{InferenceEngine::PluginConfigParams::KEY_CPU_BIND_THREAD, InferenceEngine::PluginConfigParams::YES}},
{{InferenceEngine::MultiDeviceConfigParams::KEY_MULTI_DEVICE_PRIORITIES , CommonTestUtils::DEVICE_CPU},
{InferenceEngine::PluginConfigParams::KEY_DYN_BATCH_LIMIT, "10"}}
{InferenceEngine::PluginConfigParams::KEY_CPU_BIND_THREAD, InferenceEngine::PluginConfigParams::YES}}
};
INSTANTIATE_TEST_SUITE_P(smoke_BehaviorTests, InferRequestConfigTest,

View File

@ -1,39 +0,0 @@
// Copyright (C) 2018-2023 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
//
#include <behavior/infer_request/dynamic_batch.hpp>
#include "common_test_utils/test_constants.hpp"
namespace ConfigurationTestsDefinitions {
namespace {
std::vector<size_t> batch_sizes = {
1,
5,
9,
16
};
std::map<std::string, std::string> additional_config = {
};
} // namespace
INSTANTIATE_TEST_SUITE_P(smoke_DynamicBatchTest_async, DynamicBatchTest,
::testing::Combine(
::testing::Values(CommonTestUtils::DEVICE_CPU),
::testing::Values(InferenceEngine::Precision::FP32),
::testing::Values(batch_sizes),
::testing::Values(true),
::testing::Values(additional_config)),
DynamicBatchTest::getTestCaseName);
INSTANTIATE_TEST_SUITE_P(smoke_DynamicBatchTest_sync, DynamicBatchTest,
::testing::Combine(
::testing::Values(CommonTestUtils::DEVICE_CPU),
::testing::Values(InferenceEngine::Precision::FP32),
::testing::Values(batch_sizes),
::testing::Values(false),
::testing::Values(additional_config)),
DynamicBatchTest::getTestCaseName);
} // namespace ConfigurationTestsDefinitions

View File

@ -60,7 +60,6 @@ namespace {
{{InferenceEngine::PluginConfigParams::KEY_CPU_THROUGHPUT_STREAMS, "8"}},
{{InferenceEngine::PluginConfigParams::KEY_CPU_BIND_THREAD, InferenceEngine::PluginConfigParams::NO}},
{{InferenceEngine::PluginConfigParams::KEY_CPU_BIND_THREAD, InferenceEngine::PluginConfigParams::YES}},
{{InferenceEngine::PluginConfigParams::KEY_DYN_BATCH_LIMIT, "10"}},
// check that hints doesn't override customer value (now for streams and later for other config opts)
{{InferenceEngine::PluginConfigParams::KEY_PERFORMANCE_HINT, InferenceEngine::PluginConfigParams::THROUGHPUT},
{InferenceEngine::PluginConfigParams::KEY_CPU_THROUGHPUT_STREAMS, "3"}},
@ -137,7 +136,6 @@ namespace {
{InferenceEngine::PluginConfigParams::KEY_PERFORMANCE_HINT_NUM_REQUESTS, "should be int"}},
{{InferenceEngine::PluginConfigParams::KEY_CPU_THROUGHPUT_STREAMS, "OFF"}},
{{InferenceEngine::PluginConfigParams::KEY_CPU_BIND_THREAD, "OFF"}},
{{InferenceEngine::PluginConfigParams::KEY_DYN_BATCH_LIMIT, "NAN"}}
};
const std::vector<std::map<std::string, std::string>> multiinconfigs = {
@ -168,8 +166,6 @@ namespace {
{InferenceEngine::PluginConfigParams::KEY_CPU_THROUGHPUT_STREAMS, "OFF"}},
{{InferenceEngine::MultiDeviceConfigParams::KEY_MULTI_DEVICE_PRIORITIES , CommonTestUtils::DEVICE_CPU},
{InferenceEngine::PluginConfigParams::KEY_CPU_BIND_THREAD, "OFF"}},
{{InferenceEngine::MultiDeviceConfigParams::KEY_MULTI_DEVICE_PRIORITIES , CommonTestUtils::DEVICE_CPU},
{InferenceEngine::PluginConfigParams::KEY_DYN_BATCH_LIMIT, "NAN"}},
{{InferenceEngine::MultiDeviceConfigParams::KEY_MULTI_DEVICE_PRIORITIES , CommonTestUtils::DEVICE_CPU},
{InferenceEngine::PluginConfigParams::KEY_MODEL_PRIORITY, "-1"}},
{{InferenceEngine::MultiDeviceConfigParams::KEY_MULTI_DEVICE_PRIORITIES , CommonTestUtils::DEVICE_CPU},
@ -238,7 +234,6 @@ namespace {
{{InferenceEngine::PluginConfigParams::KEY_PERF_COUNT, InferenceEngine::PluginConfigParams::YES}},
{{InferenceEngine::PluginConfigParams::KEY_EXCLUSIVE_ASYNC_REQUESTS, InferenceEngine::PluginConfigParams::NO}},
{{InferenceEngine::PluginConfigParams::KEY_EXCLUSIVE_ASYNC_REQUESTS, InferenceEngine::PluginConfigParams::YES}},
{{InferenceEngine::PluginConfigParams::KEY_DYN_BATCH_LIMIT, "10"}}
};
INSTANTIATE_TEST_SUITE_P(smoke_BehaviorTests, CorrectConfigCheck,

View File

@ -15,20 +15,6 @@ const std::vector<InferenceEngine::Precision> netPrecisions = {
InferenceEngine::Precision::FP16
};
INSTANTIATE_TEST_SUITE_P(smoke_ReshapeCheckDynBatch, ReshapeLayerTest,
::testing::Combine(
::testing::Values(true),
::testing::ValuesIn(netPrecisions),
::testing::Values(InferenceEngine::Precision::UNSPECIFIED),
::testing::Values(InferenceEngine::Precision::UNSPECIFIED),
::testing::Values(InferenceEngine::Layout::ANY),
::testing::Values(InferenceEngine::Layout::ANY),
::testing::Values(std::vector<size_t>({30, 30, 30, 30})),
::testing::Values(std::vector<int64_t>({30, 30, 30, 30})),
::testing::Values(CommonTestUtils::DEVICE_CPU),
::testing::Values(std::map<std::string, std::string>({{CONFIG_KEY(DYN_BATCH_ENABLED), CONFIG_VALUE(YES)}}))),
ReshapeLayerTest::getTestCaseName);
INSTANTIATE_TEST_SUITE_P(smoke_ReshapeCheck, ReshapeLayerTest,
::testing::Combine(
::testing::Values(true),

View File

@ -46,7 +46,7 @@ public:
void SetBlob(const std::string& name, const InferenceEngine::Blob::Ptr &data) override;
void SetBlobs(const std::string& name, const std::vector<InferenceEngine::Blob::Ptr> &data) override;
void SetBatch(int batch = -1) override;
void SetBatch(int batch = -1);
std::vector<std::shared_ptr<InferenceEngine::IVariableStateInternal>> QueryState() override;
void SetGraph(std::shared_ptr<Graph> graph);
void EnableProfiling() { m_useProfiling = true; }
@ -108,6 +108,7 @@ private:
std::map<cldnn::primitive_id, cldnn::network_output> internal_outputs;
std::vector<std::map<cldnn::primitive_id, cldnn::network_output>> internal_outputs_dynamic;
Graph::variable_states_map variables_states_;
int m_curBatch = -1;
};
} // namespace intel_gpu

View File

@ -52,7 +52,6 @@ static constexpr Property<std::vector<std::string>, PropertyMutability::RW> cust
static constexpr Property<ImplForcingMap, PropertyMutability::RW> force_implementations{"GPU_FORCE_IMPLEMENTATIONS"};
static constexpr Property<std::string, PropertyMutability::RW> config_file{"CONFIG_FILE"};
static constexpr Property<bool, PropertyMutability::RW> enable_lp_transformations{"LP_TRANSFORMS_MODE"};
static constexpr Property<bool, PropertyMutability::RW> enable_dynamic_batch{"DYN_BATCH_ENABLED"};
static constexpr Property<size_t, PropertyMutability::RW> max_dynamic_batch{"DYN_BATCH_LIMIT"};
static constexpr Property<bool, PropertyMutability::RW> exclusive_async_requests{"EXCLUSIVE_ASYNC_REQUESTS"};
static constexpr Property<bool, PropertyMutability::RW> nv12_two_inputs{"GPU_NV12_TWO_INPUTS"};

View File

@ -346,7 +346,6 @@ InferenceEngine::Parameter CompiledModel::GetMetric(const std::string &name) con
CONFIG_KEY(PERFORMANCE_HINT),
CONFIG_KEY(PERFORMANCE_HINT_NUM_REQUESTS),
CONFIG_KEY(PERF_COUNT),
CONFIG_KEY(DYN_BATCH_ENABLED),
CONFIG_KEY(CONFIG_FILE),
CONFIG_KEY(DEVICE_ID),
CONFIG_KEY(EXCLUSIVE_ASYNC_REQUESTS),

View File

@ -1053,7 +1053,7 @@ std::vector<std::shared_ptr<InferenceEngine::IVariableStateInternal>> InferReque
std::vector<std::shared_ptr<InferenceEngine::IVariableStateInternal>> ret{};
ret.reserve(variables_states_.size());
for (const auto& pair : variables_states_)
ret.push_back(std::make_shared<VariableState>(pair.first, pair.second, m_graph->get_engine(), m_curBatch));
ret.push_back(std::make_shared<VariableState>(pair.first, pair.second, m_graph->get_engine(), -1));
return ret;
}

View File

@ -229,7 +229,6 @@ std::vector<std::string> LegacyAPIHelper::get_supported_configs() {
CONFIG_KEY(PERFORMANCE_HINT),
CONFIG_KEY(PERFORMANCE_HINT_NUM_REQUESTS),
CONFIG_KEY(PERF_COUNT),
CONFIG_KEY(DYN_BATCH_ENABLED),
CONFIG_KEY(CONFIG_FILE),
CONFIG_KEY(DEVICE_ID),
CONFIG_KEY(EXCLUSIVE_ASYNC_REQUESTS),

View File

@ -170,22 +170,11 @@ Program::Program(InferenceEngine::CNNNetwork& network, cldnn::engine& engine, co
bool dyn_shape_batch_found = false;
std::map<std::string, ngraph::PartialShape> shapes;
std::map<std::string, std::pair<int64_t, int64_t>> batch_dim;
auto enable_dynamic_batch = m_config.get_property(ov::intel_gpu::enable_dynamic_batch);
if (enable_dynamic_batch) {
m_config.set_property(ov::intel_gpu::max_dynamic_batch(network.getBatchSize()));
// in case of legacy dynamic batch,
// we assume 4D input with 0 batch dim
auto param = func->get_parameters().front();
auto pname = getParamName(param);
shapes[pname] = param->get_output_partial_shape(0);
batch_dim[pname].first = 0;
batch_dim[pname].second = m_config.get_property(ov::intel_gpu::max_dynamic_batch);
} else {
dyn_shape_batch_found = IsDynBatchModel(func, shapes, batch_dim);
if (dyn_shape_batch_found) {
m_config.set_property(ov::intel_gpu::max_dynamic_batch(batch_dim.begin()->second.second));
}
}
int m_bv_sz = GetMaxBatchSizeForSingleProgram();
m_max_batch = static_cast<int>(m_config.get_property(ov::intel_gpu::max_dynamic_batch));

View File

@ -54,7 +54,6 @@ void ExecutionConfig::set_default() {
std::make_tuple(ov::intel_gpu::enable_loop_unrolling, true),
// Legacy API properties
std::make_tuple(ov::intel_gpu::enable_dynamic_batch, false),
std::make_tuple(ov::intel_gpu::exclusive_async_requests, false),
std::make_tuple(ov::intel_gpu::nv12_two_inputs, false),
std::make_tuple(ov::intel_gpu::config_file, ""),

View File

@ -1,41 +0,0 @@
// Copyright (C) 2018-2023 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
//
#include <behavior/infer_request/dynamic_batch.hpp>
#include "common_test_utils/test_constants.hpp"
namespace ConfigurationTestsDefinitions {
namespace {
std::vector<size_t> batch_sizes = {
16,
1,
5,
9,
16
};
auto additional_config = []() {
return std::map<std::string, std::string>{};
};
} // namespace
INSTANTIATE_TEST_SUITE_P(smoke_DynamicBatchTest_async, DynamicBatchTest,
::testing::Combine(
::testing::Values(CommonTestUtils::DEVICE_GPU),
::testing::Values(InferenceEngine::Precision::FP32),
::testing::Values(batch_sizes),
::testing::Values(true),
::testing::Values(additional_config())),
DynamicBatchTest::getTestCaseName);
INSTANTIATE_TEST_SUITE_P(smoke_DynamicBatchTest_sync, DynamicBatchTest,
::testing::Combine(
::testing::Values(CommonTestUtils::DEVICE_GPU),
::testing::Values(InferenceEngine::Precision::FP32),
::testing::Values(batch_sizes),
::testing::Values(false),
::testing::Values(additional_config())),
DynamicBatchTest::getTestCaseName);
} // namespace ConfigurationTestsDefinitions

View File

@ -15,21 +15,6 @@ const std::vector<InferenceEngine::Precision> netPrecisions = {
InferenceEngine::Precision::I64
};
//TODO: Issue : - 28981
INSTANTIATE_TEST_SUITE_P(DISABLE_smoke_ReshapeCheckDynBatch, ReshapeLayerTest,
::testing::Combine(
::testing::Values(true),
::testing::ValuesIn(netPrecisions),
::testing::Values(InferenceEngine::Precision::UNSPECIFIED),
::testing::Values(InferenceEngine::Precision::UNSPECIFIED),
::testing::Values(InferenceEngine::Layout::ANY),
::testing::Values(InferenceEngine::Layout::ANY),
::testing::Values(std::vector<size_t>({1, 16, 16, 16})),
::testing::Values(std::vector<int64_t>({1, 0, 256})),
::testing::Values(CommonTestUtils::DEVICE_GPU),
::testing::Values(std::map<std::string, std::string>({{CONFIG_KEY(DYN_BATCH_ENABLED), CONFIG_VALUE(YES)}}))),
ReshapeLayerTest::getTestCaseName);
INSTANTIATE_TEST_SUITE_P(smoke_ReshapeCheck, ReshapeLayerTest,
::testing::Combine(
::testing::Values(true),

View File

@ -38,7 +38,6 @@ namespace {
{{InferenceEngine::PluginConfigParams::KEY_PERFORMANCE_HINT, InferenceEngine::PluginConfigParams::LATENCY}},
{{InferenceEngine::PluginConfigParams::KEY_PERFORMANCE_HINT, InferenceEngine::PluginConfigParams::LATENCY},
{InferenceEngine::PluginConfigParams::KEY_PERFORMANCE_HINT_NUM_REQUESTS, "1"}},
{{InferenceEngine::PluginConfigParams::KEY_DYN_BATCH_LIMIT, "10"}},
// check that hints doesn't override customer value (now for streams and later for other config opts)
};
@ -88,7 +87,6 @@ INSTANTIATE_TEST_SUITE_P(ie_plugin_Hetero, CorrectConfigTests,
{InferenceEngine::PluginConfigParams::KEY_PERFORMANCE_HINT_NUM_REQUESTS, "-1"}},
{{InferenceEngine::PluginConfigParams::KEY_PERFORMANCE_HINT, InferenceEngine::PluginConfigParams::THROUGHPUT},
{InferenceEngine::PluginConfigParams::KEY_PERFORMANCE_HINT_NUM_REQUESTS, "should be int"}},
{{InferenceEngine::PluginConfigParams::KEY_DYN_BATCH_LIMIT, "NAN"}}
};
const std::vector<std::map<std::string, std::string>> pluginMultiInConfigs = {
@ -165,7 +163,6 @@ INSTANTIATE_TEST_SUITE_P(ie_plugin_Hetero, CorrectConfigTests,
{{InferenceEngine::PluginConfigParams::KEY_PERFORMANCE_HINT, InferenceEngine::PluginConfigParams::LATENCY}},
{{InferenceEngine::PluginConfigParams::KEY_PERFORMANCE_HINT, InferenceEngine::PluginConfigParams::LATENCY},
{InferenceEngine::PluginConfigParams::KEY_PERFORMANCE_HINT_NUM_REQUESTS, "1"}},
{{InferenceEngine::PluginConfigParams::KEY_DYN_BATCH_LIMIT, "10"}}
};
INSTANTIATE_TEST_SUITE_P(ie_plugin, CorrectConfigCheck,

View File

@ -1,44 +0,0 @@
// Copyright (C) 2018-2023 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
//
#pragma once
#include <cstddef>
#include <vector>
#include <string>
#include <tuple>
#include "shared_test_classes/base/layer_test_utils.hpp"
namespace ConfigurationTestsDefinitions {
typedef std::tuple<
std::string, // Device
InferenceEngine::Precision, // Network precision
std::vector<size_t>, // Batch sizes
bool, // Asynchronous execution
std::map<std::string, std::string> // Additional configuration
> dynamicBatchTestParams;
class DynamicBatchTest : virtual public LayerTestsUtils::LayerTestsCommon,
public testing::WithParamInterface<dynamicBatchTestParams> {
private:
bool run_async = false;
size_t max_batch_size = 0;
std::vector<size_t> batch_sizes;
std::vector<std::vector<InferenceEngine::Blob::Ptr>> reference_inputs;
std::vector<std::vector<InferenceEngine::Blob::Ptr>> scaled_inputs;
std::vector<std::vector<std::pair<ngraph::element::Type, std::vector<std::uint8_t>>>> reference_outputs;
std::vector<std::vector<InferenceEngine::Blob::Ptr>> actual_outputs;
std::vector<InferenceEngine::InferRequest> infer_requests;
protected:
void SetUp() override;
void Run() override;
void LoadNetwork() override;
void Infer() override;
void Validate() override;
public:
static std::string getTestCaseName(const testing::TestParamInfo<dynamicBatchTestParams> &obj);
};
} // namespace ConfigurationTestsDefinitions

View File

@ -65,11 +65,6 @@ public:
inputs.push_back(blob);
}
if (configuration.count(InferenceEngine::PluginConfigParams::KEY_DYN_BATCH_ENABLED) &&
configuration.count(InferenceEngine::PluginConfigParams::YES)) {
auto batchSize = executableNetwork.GetInputsInfo().begin()->second->getTensorDesc().getDims()[0] / 2;
inferRequest.SetBatch(static_cast<int>(batchSize));
}
inferRequest.Infer();
}

View File

@ -1,156 +0,0 @@
// Copyright (C) 2018-2023 Intel Corporation
// SPDX-License-Identifier: Apache-2.0
//
#include <tuple>
#include <string>
#include <vector>
#include <algorithm>
#include "ie_core.hpp"
#include "ie_transformations.hpp"
#include "common_test_utils/common_utils.hpp"
#include "functional_test_utils/skip_tests_config.hpp"
#include "behavior/infer_request/dynamic_batch.hpp"
#include "ngraph_functions/subgraph_builders.hpp"
namespace ConfigurationTestsDefinitions {
std::string DynamicBatchTest::getTestCaseName(const testing::TestParamInfo<dynamicBatchTestParams> &obj) {
std::string targetDevice;
InferenceEngine::Precision netPrecision;
std::vector<size_t> batchSizes;
bool runAsync;
std::map<std::string, std::string> config;
std::tie(targetDevice, netPrecision, batchSizes, runAsync, config) = obj.param;
std::ostringstream result;
result << "netPrecision=" << netPrecision.name() << "_";
result << "BS=" << CommonTestUtils::vec2str(batchSizes) << "_";
result << std::string(runAsync ? "Async" : "Sync") << "_";
result << "targetDevice=" << targetDevice;
return result.str();
}
size_t hiddenSize;
void DynamicBatchTest::SetUp() {
InferenceEngine::Precision netPrecision;
std::map<std::string, std::string> config;
std::tie(targetDevice, netPrecision, batch_sizes, run_async, config) = this->GetParam();
configuration.insert(config.begin(), config.end());
configuration[InferenceEngine::PluginConfigParams::KEY_DYN_BATCH_ENABLED] = InferenceEngine::PluginConfigParams::YES;
max_batch_size = *std::max_element(batch_sizes.begin(), batch_sizes.end());
function = ngraph::builder::subgraph::makeSingleConv();
}
void DynamicBatchTest::LoadNetwork() {
cnnNetwork = InferenceEngine::CNNNetwork{function};
ConfigureNetwork();
cnnNetwork.setBatchSize(max_batch_size);
executableNetwork = core->LoadNetwork(cnnNetwork, targetDevice, configuration);
}
void DynamicBatchTest::Infer() {
inferRequest = executableNetwork.CreateInferRequest();
inputs.clear();
for (int i = 0; i < batch_sizes.size(); i++) {
auto batch_size = batch_sizes[i];
cnnNetwork.setBatchSize(batch_size);
inputs.clear();
for (const auto &input : cnnNetwork.getInputsInfo()) {
const auto &info = input.second;
auto blob = GenerateInput(*info);
inputs.push_back(blob);
}
reference_inputs.push_back(inputs);
functionRefs = ngraph::clone_function(*function);
reference_outputs.push_back(CalculateRefs());
}
for (int i = 0; i < batch_sizes.size(); i++) {
infer_requests.push_back(executableNetwork.CreateInferRequest());
auto batch_size = batch_sizes[i];
auto& infer_request = infer_requests[i];
infer_request.SetBatch(batch_size);
inputs.clear();
for (const auto &input : executableNetwork.GetInputsInfo()) {
const auto &info = input.second;
auto blob = GenerateInput(*info);
infer_request.SetBlob(info->name(), blob);
inputs.push_back(blob);
}
scaled_inputs.push_back(inputs);
for (int j = 0; j < reference_inputs[i].size(); j++) {
auto& ref = reference_inputs[i][j];
auto& actual = scaled_inputs[i][j];
auto byte_num = ref->byteSize();
auto ref_ptr = ref->buffer().as<uint8_t*>();
auto actual_ptr = actual->buffer().as<uint8_t*>();
for (int k = 0; k < byte_num; k++) {
actual_ptr[k] = ref_ptr[k];
}
}
}
for (auto& infer_request : infer_requests) {
if (run_async) {
infer_request.StartAsync();
} else {
infer_request.Infer();
}
}
if (run_async) {
for (auto& infer_request : infer_requests) {
auto status = infer_request.Wait(10000);
if (status != InferenceEngine::StatusCode::OK) {
GTEST_FAIL() << "Inference request status after wait is not OK";
}
}
}
}
void DynamicBatchTest::Validate() {
for (int i = 0; i < infer_requests.size(); i++) {
auto outputs = std::vector<InferenceEngine::Blob::Ptr>{};
for (const auto &output : executableNetwork.GetOutputsInfo()) {
const auto &name = output.first;
outputs.push_back(infer_requests[i].GetBlob(name));
}
for (int j = 0; j < reference_outputs[i].size(); j++) {
if (reference_outputs[i][j].second.size() < outputs[j]->byteSize()) {
auto actual_ptr = outputs[j]->buffer().as<uint8_t*>();
for (int k = reference_outputs[i][j].second.size(); k < outputs[j]->byteSize(); k++) actual_ptr[k] = 0;
reference_outputs[i][j].second.resize(outputs[j]->byteSize());
}
}
Compare(reference_outputs[i], outputs);
}
}
void DynamicBatchTest::Run() {
SKIP_IF_CURRENT_TEST_IS_DISABLED();
LoadNetwork();
GenerateInputs();
Infer();
Validate();
}
TEST_P(DynamicBatchTest, CompareWithRefs) {
Run();
};
} // namespace ConfigurationTestsDefinitions

View File

@ -406,11 +406,6 @@ void LayerTestsCommon::ConfigureInferRequest() {
auto blob = inputs[i];
inferRequest.SetBlob(info->name(), blob);
}
if (configuration.count(InferenceEngine::PluginConfigParams::KEY_DYN_BATCH_ENABLED) &&
configuration.count(InferenceEngine::PluginConfigParams::YES)) {
auto batchSize = executableNetwork.GetInputsInfo().begin()->second->getTensorDesc().getDims()[0] / 2;
inferRequest.SetBatch(batchSize);
}
}
void LayerTestsCommon::Infer() {

View File

@ -101,11 +101,6 @@ void PermConvPermConcat::Run() {
inferRequest.SetBlob(info->name(), blob);
inputs.push_back(blob);
}
if (configuration.count(InferenceEngine::PluginConfigParams::KEY_DYN_BATCH_ENABLED) &&
configuration.count(InferenceEngine::PluginConfigParams::YES)) {
auto batchSize = cnnNetwork.getInputsInfo().begin()->second->getTensorDesc().getDims()[0] / 2;
inferRequest.SetBatch(batchSize);
}
inferRequest.Infer();
Validate();

View File

@ -97,11 +97,6 @@ namespace SubgraphTestsDefinitions {
inferRequest.SetBlob(info->name(), blob);
inputs.push_back(blob);
}
if (configuration.count(InferenceEngine::PluginConfigParams::KEY_DYN_BATCH_ENABLED) &&
configuration.count(InferenceEngine::PluginConfigParams::YES)) {
auto batchSize = cnnNetwork.getInputsInfo().begin()->second->getTensorDesc().getDims()[0] / 2;
inferRequest.SetBatch(batchSize);
}
inferRequest.Infer();
threshold = 0.1;

View File

@ -22,10 +22,8 @@ public:
MOCK_CONST_METHOD0(GetPerformanceCounts, std::map<std::string, InferenceEngine::InferenceEngineProfileInfo>());
MOCK_METHOD2(SetBlob, void(const std::string&, const InferenceEngine::Blob::Ptr &));
MOCK_METHOD1(GetBlob, InferenceEngine::Blob::Ptr(const std::string&));
MOCK_METHOD3(SetBlob, void(const std::string&, const InferenceEngine::Blob::Ptr &, const InferenceEngine::PreProcessInfo&));
MOCK_CONST_METHOD1(GetPreProcess, const InferenceEngine::PreProcessInfo&(const std::string&));
MOCK_METHOD1(SetCallback, void(std::function<void(std::exception_ptr)>));
MOCK_METHOD1(SetBatch, void(int));
MOCK_METHOD0(QueryState, std::vector<InferenceEngine::IVariableStateInternal::Ptr>());
MOCK_METHOD0(Cancel, void());
MOCK_METHOD0(StartAsyncImpl, void());

View File

@ -34,9 +34,6 @@ public:
MOCK_METHOD(StatusCode, GetPreProcess,
(const char*, const PreProcessInfo**, ResponseDesc*), (const, noexcept));
MOCK_METHOD(StatusCode, SetBlob, (const char*, const Blob::Ptr&, ResponseDesc*), (noexcept));
MOCK_METHOD(StatusCode, SetBlob,
(const char*, const Blob::Ptr&, const PreProcessInfo&, ResponseDesc*), (noexcept));
MOCK_METHOD(StatusCode, SetBatch, (int batch, ResponseDesc*), (noexcept));
MOCK_METHOD(StatusCode, Cancel, (ResponseDesc*), (noexcept));
};