nightly/ie_plugin_api/ie__infer__async__request__thread__safe__default_8hpp_source.html

 // Copyright (C) 2018-2021 Intel Corporation

 // SPDX-License-Identifier: Apache-2.0

 //


 #pragma once


 #include <threading/ie_immediate_executor.hpp>
 #include <threading/ie_itask_executor.hpp>
 #include <threading/ie_istreams_executor.hpp>

 #include <cpp_interfaces/interface/ie_iinfer_request_internal.hpp>

 #include <algorithm>
 #include <chrono>
 #include <cstdint>
 #include <exception>
 #include <functional>
 #include <future>
 #include <map>
 #include <memory>
 #include <mutex>
 #include <string>
 #include <tuple>
 #include <utility>
 #include <vector>


 namespace InferenceEngine {


 /**

  * @ingroup ie_dev_api_async_infer_request_api

  * @brief Base class with default implementation of asynchronous multi staged inference request.

  *        To customize pipeline stages derived class should change the content

  *        of AsyncInferRequestThreadSafeDefault::_pipeline member container.

  *        It consists of pairs of tasks and executors which will run the task.

  *        The class is recommended to be used by plugins as a base class for asynchronous inference request implementation.

  * @note  To synchronize derived context with stages

  *        derived class should call AsyncInferRequestThreadSafeDefault::StopAndWait() function in destructor.

  * @par Example

  *        Here is an example of asynchronous inference request implementation for some accelerator device.

  *        It uses 5 different executors to run different stages of a synchronous inference request.

  *

  * @snippet example_async_infer_request.cpp async_infer_request:define_pipeline

  */

 class AsyncInferRequestThreadSafeDefault : public IInferRequestInternal {

     // Life-cycle state of the request; it is read and written under _mutex.
     //  - Idle:     set by the last stage task, or by InferImpl() when starting a pipeline throws.
     //  - Busy:     set by InferImpl() before the pipeline is started.
     //  - Canceled: set by Cancel() while the request is Busy.
     //  - Stop:     set by StopAndWait(); InferImpl() does not run a pipeline when it observes it.
     enum InferState {Idle, Busy, Canceled, Stop};

     // One shared future per started pipeline; Wait() and StopAndWait() block on them.
     using Futures = std::vector<std::shared_future<void>>;

     // NOTE(review): this alias is not referenced by the code visible in this file.
     using Promise = std::shared_ptr<std::promise<void>>;

     // Indices for std::get<> on a Stage pair: the executor is the first element, the task the second.
     enum Stage_e : std::uint8_t { executor, task };

     // The wrapped synchronous request; blob, batch, state and profiling calls are forwarded to it.
     IInferRequestInternal::Ptr _syncRequest;


     // Lets the guard below reach _mutex and _callback of the enclosing request.
     friend struct DisableCallbackGuard;

     /**
      * @brief Scope guard that detaches the completion callback of a request for the guard's lifetime.
      *
      * The constructor swaps the request's callback into the guard (leaving the request with the
      * guard's default-constructed, empty callback); the destructor hands it back.
      * Both steps are done while holding the request's mutex.
      */
     struct DisableCallbackGuard {
         /**
          * @brief Takes the callback away from the given request
          * @param this_ The request whose callback is disabled; must outlive the guard
          */
         explicit DisableCallbackGuard(AsyncInferRequestThreadSafeDefault* this_)
             : _this{this_} {
             std::lock_guard<std::mutex> lock{_this->_mutex};
             std::swap(_callback, _this->_callback);
         }

         /**
          * @brief Gives the stored callback back to the request
          */
         ~DisableCallbackGuard() {
             std::lock_guard<std::mutex> lock{_this->_mutex};
             // Move instead of copy: the guard's copy is dead after this point, and copying
             // a std::function may allocate (and therefore throw) inside a destructor.
             _this->_callback = std::move(_callback);
         }

         // A copied guard would restore the callback twice, so copying is forbidden.
         DisableCallbackGuard(const DisableCallbackGuard&) = delete;
         DisableCallbackGuard& operator=(const DisableCallbackGuard&) = delete;

         AsyncInferRequestThreadSafeDefault* _this = nullptr;  //!< Request the callback was taken from
         Callback _callback;                                   //!< Callback parked while the guard is alive
     };


     /**
      * @brief ITaskExecutor adapter that hands every task to IStreamsExecutor::Execute()
      *        of the wrapped streams executor.
      */
     struct ImmediateStreamsExecutor : public InferenceEngine::ITaskExecutor {
         /**
          * @brief Wraps a streams executor
          * @param streamsExecutor The executor whose Execute() will receive the tasks
          */
         explicit ImmediateStreamsExecutor(const IStreamsExecutor::Ptr& streamsExecutor)
             : _streamsExecutor(streamsExecutor) {}

         /**
          * @brief Forwards the task to IStreamsExecutor::Execute()
          * @param task The task to run
          */
         void run(InferenceEngine::Task task) override {
             _streamsExecutor->Execute(std::move(task));
         }

         IStreamsExecutor::Ptr _streamsExecutor;  //!< Wrapped streams executor
     };


     /**
      * @brief Common entry point of StartAsync() and Infer(): validates the blobs and the request
      *        state, registers a fresh promise/future pair and then runs the start functor.
      *
      * @tparam F Callable without arguments that starts the pipeline
      * @param f The start functor; it is not invoked when the request has been stopped
      *
      * Throws RequestBusy when a pipeline is already in flight and InferCancelled when the request
      * is in the canceled state. An exception thrown by `f` is stored in the promise, the state is
      * reset to Idle and the exception is rethrown to the caller.
      */
     template<typename F>
     void InferImpl(const F& f) {
         _syncRequest->checkBlobs();
         InferState state = InferState::Idle;
         {
             std::lock_guard<std::mutex> lock{_mutex};
             state = _state;
             switch (_state) {
             case InferState::Busy :
                 IE_THROW(RequestBusy);
             case InferState::Canceled :
                 IE_THROW(InferCancelled);
             case InferState::Idle : {
                 // Drop futures that are invalid or already completed so the list does not grow forever.
                 _futures.erase(std::remove_if(std::begin(_futures), std::end(_futures),
                                               [](const std::shared_future<void>& future) {
                                                   return !future.valid() ||
                                                          (std::future_status::ready ==
                                                           future.wait_for(std::chrono::milliseconds {0}));
                                               }),
                                _futures.end());
                 _promise = {};
                 _futures.emplace_back(_promise.get_future().share());
                 // Only an idle request becomes busy. Previously the assignment was done after the
                 // switch and therefore also overwrote Stop, leaving a stopped request stuck in Busy
                 // although no pipeline was started for it.
                 _state = InferState::Busy;
             } break;
             case InferState::Stop : break;
             }
         }
         if (state != InferState::Stop) {
             try {
                 f();
             } catch (...) {
                 // Starting the pipeline failed: publish the error to waiters and make the request usable again.
                 _promise.set_exception(std::current_exception());
                 std::lock_guard<std::mutex> lock{_mutex};
                 _state = InferState::Idle;
                 throw;
             }
         }
     }


 protected:

     /**
      * @brief Verifies that the request may be touched right now.
      *        Throws RequestBusy while a pipeline is in flight and InferCancelled while the
      *        request is in the canceled state; returns normally for every other state.
      */
     void CheckState() const {
         std::lock_guard<std::mutex> lock {_mutex};
         if (InferState::Busy == _state) {
             IE_THROW(RequestBusy);
         }
         if (InferState::Canceled == _state) {
             IE_THROW(InferCancelled);
         }
     }


 public:

     /**

      * @brief Shared-ownership handle (std::shared_ptr) to an AsyncInferRequestThreadSafeDefault

      */

     using Ptr = std::shared_ptr<AsyncInferRequestThreadSafeDefault>;


     /**
      * @brief      Wraps a synchronous IInferRequestInternal and builds the two default one-stage pipelines.
      *
      * The asynchronous AsyncInferRequestThreadSafeDefault::_pipeline runs IInferRequestInternal::InferImpl
      * on `taskExecutor`. The synchronous AsyncInferRequestThreadSafeDefault::_syncPipeline runs the same
      * task on an ImmediateExecutor, or - when `taskExecutor` is an IStreamsExecutor - on an adapter that
      * calls IStreamsExecutor::Execute().
      *
      * @param[in]  request           The synchronous request
      * @param[in]  taskExecutor      The task executor
      * @param[in]  callbackExecutor  The callback executor
      */
     AsyncInferRequestThreadSafeDefault(const IInferRequestInternal::Ptr& request,
                                        const ITaskExecutor::Ptr& taskExecutor,
                                        const ITaskExecutor::Ptr& callbackExecutor) :
         _syncRequest {request},
         _requestExecutor {taskExecutor},
         _callbackExecutor {callbackExecutor},
         _pipeline {{taskExecutor, [this] {_syncRequest->InferImpl();}}},
         _syncPipeline {{std::make_shared<ImmediateExecutor>(), [this] {_syncRequest->InferImpl();}}} {
         auto streamsExecutor = std::dynamic_pointer_cast<IStreamsExecutor>(taskExecutor);
         if (nullptr == streamsExecutor) {
             // Not a streams executor: keep the ImmediateExecutor based synchronous pipeline.
             return;
         }
         _syncPipeline = {{std::make_shared<ImmediateStreamsExecutor>(std::move(streamsExecutor)), [this] {_syncRequest->InferImpl();}}};
     }


     /**
      * @brief      Destroys the object: calls StopAndWait() so that no pipeline is started anymore and
      *             the already started ones have finished before the members are destroyed.
      */
     ~AsyncInferRequestThreadSafeDefault() {
         this->StopAndWait();
     }


     /**
      * @brief Waits for completion of the pipeline that was started last.
      *        If the pipeline raised an exception it is rethrown here.
      * @param millis_timeout A timeout in `ms` to wait or a special enum value of InferRequest::WaitMode.
      *        Values below InferRequest::WaitMode::RESULT_READY are rejected with ParameterMismatch.
      * @return StatusCode::INFER_NOT_STARTED when no pipeline has been registered,
      *         StatusCode::OK when the pipeline has finished,
      *         StatusCode::RESULT_NOT_READY otherwise
      */
     StatusCode Wait(int64_t millis_timeout) override {
         if (millis_timeout < InferRequest::WaitMode::RESULT_READY) {
             IE_THROW(ParameterMismatch)
                 << " Timeout can't be less "
                 << InferRequest::WaitMode::RESULT_READY << " for InferRequest::Wait\n";
         }

         // The most recently registered future is the one that tracks the current pipeline.
         std::shared_future<void> lastFuture;
         {
             std::lock_guard<std::mutex> lock {_mutex};
             if (!_futures.empty()) {
                 lastFuture = _futures.back();
             }
         }
         if (!lastFuture.valid()) {
             return StatusCode::INFER_NOT_STARTED;
         }

         bool finished = false;
         if (millis_timeout == InferRequest::WaitMode::RESULT_READY) {
             // Block without a time limit.
             lastFuture.wait();
             finished = true;
         } else if (millis_timeout == InferRequest::WaitMode::STATUS_ONLY) {
             // Poll only.
             finished = (std::future_status::ready == lastFuture.wait_for(std::chrono::milliseconds {0}));
         } else {
             finished = (std::future_status::ready == lastFuture.wait_for(std::chrono::milliseconds {millis_timeout}));
         }

         if (!finished) {
             return StatusCode::RESULT_NOT_READY;
         }
         // get() rethrows the exception stored by the pipeline, if any.
         lastFuture.get();
         return StatusCode::OK;
     }


     void StartAsync() override {

         InferImpl([&] {StartAsync_ThreadUnsafe();});

     }


     void Infer() override {

         DisableCallbackGuard disableCallbackGuard{this};

         InferImpl([&] {Infer_ThreadUnsafe();});

         Wait(InferRequest::WaitMode::RESULT_READY);

     }


     std::map<std::string, InferenceEngineProfileInfo> GetPerformanceCounts() const override {

         CheckState();

         return _syncRequest->GetPerformanceCounts();

     }


     /**
      * @brief Forwards the blob to the wrapped synchronous request after CheckState() has passed
      *        (RequestBusy / InferCancelled may be thrown).
      * @param name Name passed through to the wrapped request
      * @param data Blob passed through to the wrapped request
      */
     void SetBlob(const std::string& name, const Blob::Ptr& data) override {
         this->CheckState();
         _syncRequest->SetBlob(name, data);
     }


     /**
      * @brief Forwards the blob together with its pre-processing info to the wrapped synchronous
      *        request after CheckState() has passed (RequestBusy / InferCancelled may be thrown).
      * @param name Name passed through to the wrapped request
      * @param data Blob passed through to the wrapped request
      * @param info Pre-processing info passed through to the wrapped request
      */
     void SetBlob(const std::string& name, const Blob::Ptr& data, const PreProcessInfo& info) override {
         this->CheckState();
         _syncRequest->SetBlob(name, data, info);
     }


     /**
      * @brief Fetches a blob from the wrapped synchronous request after CheckState() has passed
      *        (RequestBusy / InferCancelled may be thrown).
      * @param name Name passed through to the wrapped request
      * @return The blob returned by the wrapped request
      */
     Blob::Ptr GetBlob(const std::string& name) override {
         this->CheckState();
         Blob::Ptr blob = _syncRequest->GetBlob(name);
         return blob;
     }


     /**
      * @brief Returns the pre-processing info held by the wrapped synchronous request.
      *        Unlike the other forwarding methods this one does not call CheckState().
      * @param name Name passed through to the wrapped request
      * @return The reference returned by the wrapped request
      */
     const PreProcessInfo& GetPreProcess(const std::string& name) const override {
         const PreProcessInfo& preProcessInfo = _syncRequest->GetPreProcess(name);
         return preProcessInfo;
     }


     /**
      * @brief Forwards the batch size to the wrapped synchronous request after CheckState() has passed
      *        (RequestBusy / InferCancelled may be thrown).
      * @param batch Batch size passed through to the wrapped request
      */
     void SetBatch(int batch) override {
         CheckState();
         _syncRequest->SetBatch(batch);
     }


     /**
      * @brief Installs the completion callback of the request.
      *        Throws RequestBusy while a pipeline is in flight and InferCancelled while the request
      *        is in the canceled state; in both cases the current callback is left untouched.
      * @param callback The new callback; an empty callback disables notification
      */
     void SetCallback(Callback callback) override {
         {
             // The state check and the update are done under one lock: _callback is read under
             // _mutex by the last pipeline stage, DisableCallbackGuard and StopAndWait(), so an
             // unlocked write here would race with them.
             std::lock_guard<std::mutex> lock{_mutex};
             switch (_state) {
             case InferState::Busy :
                 IE_THROW(RequestBusy);
             case InferState::Canceled :
                 IE_THROW(InferCancelled);
             default: break;
             }
             std::swap(_callback, callback);
         }
         // The previous callback now lives in `callback` and is destroyed on return,
         // i.e. outside of the critical section.
     }


     /**
      * @brief Returns the variable states of the wrapped synchronous request after CheckState() has
      *        passed (RequestBusy / InferCancelled may be thrown).
      * @return The vector returned by the wrapped request's QueryState()
      */
     std::vector<std::shared_ptr<InferenceEngine::IVariableStateInternal>> QueryState() override {
         this->CheckState();
         auto states = _syncRequest->QueryState();
         return states;
     }


     /**
      * @brief Throws InferCancelled when the request is in the canceled state, otherwise does nothing.
      */
     void ThrowIfCanceled() const {
         std::lock_guard<std::mutex> lock{_mutex};
         if (InferState::Canceled != _state) {
             return;
         }
         IE_THROW(InferCancelled);
     }


     /**
      * @brief Marks a busy request as canceled. A request in any other state is left unchanged.
      * @note  Only the state flag is changed here; stages can observe it through ThrowIfCanceled().
      */
     void Cancel() override {
         std::lock_guard<std::mutex> lock{_mutex};
         if (InferState::Busy != _state) {
             return;
         }
         _state = InferState::Canceled;
     }


 protected:

     /**

      * @brief Each pipeline stage is a @ref Task paired with the ITaskExecutor implementation that executes it.

      *        The executor is the first element of the pair and the task the second one.

      */

     using Stage = std::pair<ITaskExecutor::Ptr, Task>;

     /**

      * @brief Pipeline is a vector of stages; the stages are run one after another in vector order.

      */

     using Pipeline = std::vector<Stage>;


     /**
      * @brief Creates the task of the first stage and submits it to the first stage executor.
      *        The remaining stages are chained by the task itself.
      * @note  The future used to wait for the pipeline is registered by the caller side before the
      *        start functor runs, not by this function.
      * @param[in]  itBeginStage Iterator to begin of pipeline; the range must not be empty
      * @param[in]  itEndStage End pipeline iterator
      * @param[in]  callbackExecutor Final or error stage executor; when empty the final stage is
      *             run directly by the stage task that reaches it
      */
     void RunFirstStage(const Pipeline::iterator itBeginStage, const Pipeline::iterator itEndStage,
                        ITaskExecutor::Ptr callbackExecutor = {}) {
         // An empty pipeline would dereference the end iterator below.
         IE_ASSERT(itBeginStage != itEndStage);
         auto& firstStageExecutor = std::get<Stage_e::executor>(*itBeginStage);
         IE_ASSERT(nullptr != firstStageExecutor);
         // The parameter is a non-const value so that this std::move really moves the shared pointer.
         firstStageExecutor->run(MakeNextStageTask(itBeginStage, itEndStage, std::move(callbackExecutor)));
     }


     /**

      * @brief Forbids pipeline start and wait for all started pipelines.

      * @note Should be called in derived class destructor to wait for completion of usage of derived context captured by

      * pipeline tasks

      */

     void StopAndWait() {

         Futures futures;

         InferState state = InferState::Idle;

         {

             std::lock_guard<std::mutex> lock{_mutex};

             state = _state;

             if (state != InferState::Stop) {

                 _callback = {};

                 _state = InferState::Stop;

                 futures = std::move(_futures);

             }

         }

         if (state != InferState::Stop) {

             for (auto&& future : futures) {

                 if (future.valid()) {

                     future.wait();

                 }

             }

         }

     }


     ITaskExecutor::Ptr _requestExecutor;  //!< Used to run inference CPU tasks.

     ITaskExecutor::Ptr _callbackExecutor;  //!< Used to run post inference callback in asynchronous pipeline

     // Not set by the constructor of this class, so it stays empty unless a derived class assigns it;
     // with an empty executor the final stage is run directly instead of being submitted.
     ITaskExecutor::Ptr _syncCallbackExecutor;  //!< Used to run post inference callback in synchronous pipeline

     Pipeline _pipeline;  //!< Pipeline variable that should be filled by inherited class.

     Pipeline _syncPipeline;  //!< Synchronous pipeline variable that should be filled by inherited class.


     /**
      * @brief Starts the asynchronous pipeline without any state checks or locking:
      *        runs the first stage of AsyncInferRequestThreadSafeDefault::_pipeline with
      *        AsyncInferRequestThreadSafeDefault::_callbackExecutor as the final stage executor.
      * @note Used by StartAsync which ensures thread-safety and calls this method after.
      */
     virtual void StartAsync_ThreadUnsafe() {
         const auto firstStage = _pipeline.begin();
         const auto endStage = _pipeline.end();
         RunFirstStage(firstStage, endStage, _callbackExecutor);
     }


     /**
      * @brief Starts the synchronous pipeline without any state checks or locking:
      *        runs the first stage of AsyncInferRequestThreadSafeDefault::_syncPipeline with
      *        AsyncInferRequestThreadSafeDefault::_syncCallbackExecutor as the final stage executor.
      * @note Used by Infer which ensures thread-safety and calls this method after.
      */
     virtual void Infer_ThreadUnsafe() {
         const auto firstStage = _syncPipeline.begin();
         const auto endStage = _syncPipeline.end();
         RunFirstStage(firstStage, endStage, _syncCallbackExecutor);
     }


     /**

      * @brief Implements Infer() using StartAsync() and Wait()

      */

     void InferUsingAsync() {

         StartAsync_ThreadUnsafe();

     }


 private:

     /**
      * @brief Create a task with next pipeline stage.
      * Each call to MakeNextStageTask() generates a @ref Task object for one stage; when that task runs it
      * executes the stage and, unless it was the last one, submits the task of the following stage.
      * On last stage or if the exception is raised from `_pipeline` task
      * the last stage task is called or passed to callback executor if it is presented. The last stage task
      * takes over the `_promise` member, resets the state to Idle, calls the callback if it is presented and
      * uses the promise to forward completion or exception to the one of `_futures` member
      * @param[in]  itStage Iterator to next stage of pipeline
      * @param[in]  itEndStage End pipeline iterator
      * @param[in]  callbackExecutor Executor that will run final stage with callback call
      * @return A next stage task
      */
     Task MakeNextStageTask(const Pipeline::iterator itStage, const Pipeline::iterator itEndStage,
                            ITaskExecutor::Ptr callbackExecutor) {
         // The executor is stored inside the returned task through std::bind and handed to the lambda
         // as an lvalue reference. The parameter is a non-const value so that the std::move at the
         // bottom really moves the shared pointer instead of copying it.
         return std::bind([this, itStage, itEndStage](ITaskExecutor::Ptr& callbackExecutor) mutable {
             std::exception_ptr currentException = nullptr;
             auto& thisStage = *itStage;
             auto itNextStage = itStage + 1;
             try {
                 auto& stageTask = std::get<Stage_e::task>(thisStage);
                 IE_ASSERT(nullptr != stageTask);
                 stageTask();
                 if (itEndStage != itNextStage) {
                     auto& nextStage = *itNextStage;
                     auto& nextStageExecutor = std::get<Stage_e::executor>(nextStage);
                     IE_ASSERT(nullptr != nextStageExecutor);
                     // The callback executor travels along the chain to the stage that finishes the pipeline.
                     nextStageExecutor->run(MakeNextStageTask(itNextStage, itEndStage, std::move(callbackExecutor)));
                 }
             } catch (...) {
                 // Any failure of the stage (or of submitting the next one) ends the pipeline with this error.
                 currentException = std::current_exception();
             }

             if ((itEndStage == itNextStage) || (nullptr != currentException)) {
                 auto lastStageTask = [this, currentException]() mutable {
                     // Take the promise first: once the state is Idle a new start may replace `_promise`.
                     auto promise = std::move(_promise);
                     Callback callback;
                     {
                         std::lock_guard<std::mutex> lock{_mutex};
                         _state = InferState::Idle;
                         callback = _callback;
                     }
                     if (callback) {
                         try {
                             auto local_callback = std::move(callback);
                             local_callback(currentException);
                         } catch (...) {
                             // An exception escaping the callback replaces the pipeline result.
                             currentException = std::current_exception();
                         }
                     }
                     if (nullptr == currentException) {
                         promise.set_value();
                     } else {
                         promise.set_exception(currentException);
                     }
                 };

                 if (nullptr == callbackExecutor) {
                     lastStageTask();
                 } else {
                     callbackExecutor->run(std::move(lastStageTask));
                 }
             }
         }, std::move(callbackExecutor));
     }


     // Promise of the pipeline started last: re-created by InferImpl() and fulfilled
     // (value or exception) by the last stage task or by InferImpl() when starting fails.
     std::promise<void> _promise;

     // Protects _state and _futures; it is also taken around the _callback accesses in
     // DisableCallbackGuard, StopAndWait() and the last stage task. Mutable because the
     // const methods CheckState() and ThrowIfCanceled() lock it.
     mutable std::mutex _mutex;

     // Futures of the started pipelines; completed ones are pruned on the next start.
     Futures _futures;

     // Current life-cycle state of the request, see InferState.
     InferState _state = InferState::Idle;

 };

 }  // namespace InferenceEngine

InferenceEngine::AsyncInferRequestThreadSafeDefault
Base class with default implementation of asynchronous multi staged inference request....
Definition: ie_infer_async_request_thread_safe_default.hpp:40

InferenceEngine::AsyncInferRequestThreadSafeDefault::InferUsingAsync
void InferUsingAsync()
Implements Infer() using StartAsync() and Wait()
Definition: ie_infer_async_request_thread_safe_default.hpp:346

InferenceEngine::AsyncInferRequestThreadSafeDefault::Wait
StatusCode Wait(int64_t millis_timeout) override
Waits for completion of all pipeline stages If the pipeline raises an exception it will be rethrown h...
Definition: ie_infer_async_request_thread_safe_default.hpp:167

InferenceEngine::AsyncInferRequestThreadSafeDefault::GetPerformanceCounts
std::map< std::string, InferenceEngineProfileInfo > GetPerformanceCounts() const override
Queries performance measures per layer to get feedback of what is the most time consuming layer....
Definition: ie_infer_async_request_thread_safe_default.hpp:216

InferenceEngine::AsyncInferRequestThreadSafeDefault::RunFirstStage
void RunFirstStage(const Pipeline::iterator itBeginStage, const Pipeline::iterator itEndStage, const ITaskExecutor::Ptr callbackExecutor={})
Creates and run the first stage task. If destructor was not called add a new std::future to the Async...
Definition: ie_infer_async_request_thread_safe_default.hpp:287

InferenceEngine::AsyncInferRequestThreadSafeDefault::Stage
std::pair< ITaskExecutor::Ptr, Task > Stage
Each pipeline stage is a Task that is executed by specified ITaskExecutor implementation.
Definition: ie_infer_async_request_thread_safe_default.hpp:273

InferenceEngine::AsyncInferRequestThreadSafeDefault::SetBlob
void SetBlob(const std::string &name, const Blob::Ptr &data) override
Set input/output data to infer.
Definition: ie_infer_async_request_thread_safe_default.hpp:221

InferenceEngine::AsyncInferRequestThreadSafeDefault::Ptr
std::shared_ptr< AsyncInferRequestThreadSafeDefault > Ptr
A shared pointer to AsyncInferRequestThreadSafeDefault.
Definition: ie_infer_async_request_thread_safe_default.hpp:129

InferenceEngine::AsyncInferRequestThreadSafeDefault::Cancel
void Cancel() override
Cancel current inference request execution.
Definition: ie_infer_async_request_thread_safe_default.hpp:262

InferenceEngine::AsyncInferRequestThreadSafeDefault::Infer
void Infer() override
Infers specified input(s) in synchronous mode.
Definition: ie_infer_async_request_thread_safe_default.hpp:210

InferenceEngine::AsyncInferRequestThreadSafeDefault::SetBatch
void SetBatch(int batch) override
Sets new batch size when dynamic batching is enabled in executable network that created this request.
Definition: ie_infer_async_request_thread_safe_default.hpp:240

InferenceEngine::AsyncInferRequestThreadSafeDefault::_syncCallbackExecutor
ITaskExecutor::Ptr _syncCallbackExecutor
Used to run post inference callback in synchronous pipeline.
Definition: ie_infer_async_request_thread_safe_default.hpp:323

InferenceEngine::AsyncInferRequestThreadSafeDefault::SetCallback
void SetCallback(Callback callback) override
Set callback function which will be called on success or failure of asynchronous request.
Definition: ie_infer_async_request_thread_safe_default.hpp:245

InferenceEngine::AsyncInferRequestThreadSafeDefault::AsyncInferRequestThreadSafeDefault
AsyncInferRequestThreadSafeDefault(const IInferRequestInternal::Ptr &request, const ITaskExecutor::Ptr &taskExecutor, const ITaskExecutor::Ptr &callbackExecutor)
Wraps a IInferRequestInternal::Ptr implementation and constructs a AsyncInferRequestThreadSafeDefault...
Definition: ie_infer_async_request_thread_safe_default.hpp:140

InferenceEngine::AsyncInferRequestThreadSafeDefault::GetBlob
Blob::Ptr GetBlob(const std::string &name) override
Get input/output data to infer.
Definition: ie_infer_async_request_thread_safe_default.hpp:231

InferenceEngine::AsyncInferRequestThreadSafeDefault::StartAsync_ThreadUnsafe
virtual void StartAsync_ThreadUnsafe()
Starts an asynchronous pipeline thread unsafe.
Definition: ie_infer_async_request_thread_safe_default.hpp:331

InferenceEngine::AsyncInferRequestThreadSafeDefault::Pipeline
std::vector< Stage > Pipeline
Pipeline is vector of stages.
Definition: ie_infer_async_request_thread_safe_default.hpp:277

InferenceEngine::AsyncInferRequestThreadSafeDefault::StartAsync
void StartAsync() override
Start inference of specified input(s) in asynchronous mode.
Definition: ie_infer_async_request_thread_safe_default.hpp:206

InferenceEngine::AsyncInferRequestThreadSafeDefault::_syncPipeline
Pipeline _syncPipeline
Synchronous pipeline variable that should be filled by inherited class.
Definition: ie_infer_async_request_thread_safe_default.hpp:325

InferenceEngine::AsyncInferRequestThreadSafeDefault::CheckState
void CheckState() const
Throws exception if inference request is busy or canceled.
Definition: ie_infer_async_request_thread_safe_default.hpp:114

InferenceEngine::AsyncInferRequestThreadSafeDefault::SetBlob
void SetBlob(const std::string &name, const Blob::Ptr &data, const PreProcessInfo &info) override
Sets pre-process for input data.
Definition: ie_infer_async_request_thread_safe_default.hpp:226

InferenceEngine::AsyncInferRequestThreadSafeDefault::~AsyncInferRequestThreadSafeDefault
~AsyncInferRequestThreadSafeDefault()
Destroys the object, stops AsyncInferRequestThreadSafeDefault::_pipeline and waits for a finish.
Definition: ie_infer_async_request_thread_safe_default.hpp:157

InferenceEngine::AsyncInferRequestThreadSafeDefault::_callbackExecutor
ITaskExecutor::Ptr _callbackExecutor
Used to run post inference callback in asynchronous pipeline.
Definition: ie_infer_async_request_thread_safe_default.hpp:322

InferenceEngine::AsyncInferRequestThreadSafeDefault::Infer_ThreadUnsafe
virtual void Infer_ThreadUnsafe()
Performs inference of pipeline in synchronous mode.
Definition: ie_infer_async_request_thread_safe_default.hpp:339

InferenceEngine::AsyncInferRequestThreadSafeDefault::QueryState
std::vector< std::shared_ptr< InferenceEngine::IVariableStateInternal > > QueryState() override
Queries memory states.
Definition: ie_infer_async_request_thread_safe_default.hpp:250

InferenceEngine::AsyncInferRequestThreadSafeDefault::_pipeline
Pipeline _pipeline
Pipeline variable that should be filled by inherited class.
Definition: ie_infer_async_request_thread_safe_default.hpp:324

InferenceEngine::AsyncInferRequestThreadSafeDefault::StopAndWait
void StopAndWait()
Forbids pipeline start and wait for all started pipelines.
Definition: ie_infer_async_request_thread_safe_default.hpp:299

InferenceEngine::AsyncInferRequestThreadSafeDefault::_requestExecutor
ITaskExecutor::Ptr _requestExecutor
Used to run inference CPU tasks.
Definition: ie_infer_async_request_thread_safe_default.hpp:321

InferenceEngine::AsyncInferRequestThreadSafeDefault::GetPreProcess
const PreProcessInfo & GetPreProcess(const std::string &name) const override
Gets pre-process for input data.
Definition: ie_infer_async_request_thread_safe_default.hpp:236

InferenceEngine::Blob::Ptr
std::shared_ptr< Blob > Ptr

InferenceEngine::IInferRequestInternal
An internal API of synchronous inference request to be implemented by plugin, which is used in InferR...
Definition: ie_iinfer_request_internal.hpp:28

InferenceEngine::IInferRequestInternal::InferImpl
virtual void InferImpl()
The minimal infer function to be implemented by plugins. It infers specified input(s) in synchronous ...

InferenceEngine::IInferRequestInternal::_callback
Callback _callback
A callback.
Definition: ie_iinfer_request_internal.hpp:239

InferenceEngine::IInferRequestInternal::Ptr
std::shared_ptr< IInferRequestInternal > Ptr
A shared pointer to a IInferRequestInternal interface.
Definition: ie_iinfer_request_internal.hpp:33

InferenceEngine::IInferRequestInternal::Callback
std::function< void(std::exception_ptr)> Callback
Alias for callback type.
Definition: ie_iinfer_request_internal.hpp:147

InferenceEngine::IStreamsExecutor::Ptr
std::shared_ptr< IStreamsExecutor > Ptr
Definition: ie_istreams_executor.hpp:36

InferenceEngine::ITaskExecutor
Interface for Task Executor. Inference Engine uses InferenceEngine::ITaskExecutor interface to run al...
Definition: ie_itask_executor.hpp:46

InferenceEngine::ITaskExecutor::Ptr
std::shared_ptr< ITaskExecutor > Ptr
Definition: ie_itask_executor.hpp:51

InferenceEngine::PreProcessInfo

InferenceEngine::Task
std::function< void()> Task
Inference Engine Task Executor can use any copyable callable without parameters and output as a task....
Definition: ie_itask_executor.hpp:25

IE_THROW
#define IE_THROW(...)

IE_ASSERT
#define IE_ASSERT(EXPRESSION)

ie_immediate_executor.hpp
A header file for Inference Engine Immediate Executor implementation.

ie_istreams_executor.hpp
A header file for Inference Engine Streams-based Executor Interface.

ie_itask_executor.hpp
A header file for Inference Engine Task Executor Interface.

InferenceEngine
Inference Engine Plugin API namespace.

InferenceEngine::StatusCode
StatusCode