/*
|
* Copyright (C) 2017 The Android Open Source Project
|
*
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
* you may not use this file except in compliance with the License.
|
* You may obtain a copy of the License at
|
*
|
* http://www.apache.org/licenses/LICENSE-2.0
|
*
|
* Unless required by applicable law or agreed to in writing, software
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
* See the License for the specific language governing permissions and
|
* limitations under the License.
|
*/
|
|
#ifndef ANDROID_ML_NN_RUNTIME_CALLBACKS_H
|
#define ANDROID_ML_NN_RUNTIME_CALLBACKS_H
|
|
#include <android-base/thread_annotations.h>
|
#include <android/hardware/neuralnetworks/1.0/IExecutionCallback.h>
|
#include <android/hardware/neuralnetworks/1.0/IPreparedModelCallback.h>
|
#include <android/hardware/neuralnetworks/1.2/IExecutionCallback.h>
|
#include <android/hardware/neuralnetworks/1.2/IPreparedModelCallback.h>
|
#include <hidl/MQDescriptor.h>
|
#include <hidl/Status.h>
|
#include <condition_variable>
|
#include <functional>
|
#include <mutex>
|
#include <thread>
|
|
/*
|
* The Callback classes are used internally by the NeuralNetworks runtime to
|
* synchronize between different threads. An asynchronous task is launched
|
* paired with a callback object. When a client thread requires the output being
|
* generated by the asynchronous task, the client thread can wait for the result
|
* and be blocked until it has completed. Any wait may safely be called
|
* concurrently, even on the same callback object. When the asynchronous task
|
* has finished its workload, it must immediately call "notify*". If the
|
* asynchronous task has failed to launch, the function that tried to launch the
|
* asynchronous task must immediately call "notify*". This "notify*" call
|
* awakens any client threads waiting on the callback object.
|
*
|
* These classes exist to enable synchronization across HIDL. When
|
* synchronization is only required in the same process, consider using
|
* std::future, std::mutex, std::condition_variable, or std::experimental::latch
|
* instead.
|
*/
|
|
namespace android::hardware::neuralnetworks::V1_2::implementation {
|
|
using V1_0::ErrorStatus;
|
|
/**
|
* The PreparedModelCallback class is used to receive the error status of
|
* preparing a model as well as the prepared model from a task executing
|
* asynchronously with respect to the runtime. If a calling thread calls wait
|
* or get* on a PreparedModelCallback object and the corresponding asynchronous
|
* task has not finished preparing the model, the calling thread will block
|
* until the asynchronous task has either called notify or notify_1_2.
|
*
|
* If the callback object is notified more than once, only the results of the
|
* first call to notify* are used, and the results from subsequent calls are
|
* discarded.
|
*
|
* This callback object is passed as an argument to IDevice::prepareModel*.
|
*/
|
class PreparedModelCallback : public IPreparedModelCallback {
|
public:
|
/**
|
* IPreparedModelCallback::notify marks the callback object with the return
|
* status of the asynchronous model preparation along with the prepared
|
* model, and allows all prior and future wait calls on the
|
* PreparedModelCallback object to proceed.
|
*
|
* Either IPreparedModelCallback::notify or
|
* IPreparedModelCallback::notify_1_2 must be called on a given
|
* PreparedModelCallback object.
|
*
|
* If the callback object is notified more than once, only the results of
|
* the first call to notify* are used, and the results from subsequent calls
|
* are discarded.
|
*
|
* @param status Error status returned from asynchronously preparing the
|
* model; will be:
|
* - NONE if the asynchronous preparation was successful
|
* - DEVICE_UNAVAILABLE if driver is offline or busy
|
* - GENERAL_FAILURE if there is an unspecified error
|
* - INVALID_ARGUMENT if the input model is invalid
|
* @param preparedModel Returned model that has been prepared for execution,
|
* nullptr if the model was unable to be prepared.
|
*/
|
Return<void> notify(ErrorStatus status, const sp<V1_0::IPreparedModel>& preparedModel) override;
|
|
/**
|
* IPreparedModelCallback::notify_1_2 marks the callback object with the
|
* return status of the asynchronous model preparation along with the
|
* prepared model, and allows all prior and future wait calls on the
|
* PreparedModelCallback object to proceed.
|
*
|
* Either IPreparedModelCallback::notify or
|
* IPreparedModelCallback::notify_1_2 must be called on a given
|
* PreparedModelCallback object.
|
*
|
* If the callback object is notified more than once, only the results of
|
* the first call to notify* are used, and the results from subsequent calls
|
* are discarded.
|
*
|
* @param status Error status returned from asynchronously preparing the
|
* model; will be:
|
* - NONE if the asynchronous preparation was successful
|
* - DEVICE_UNAVAILABLE if driver is offline or busy
|
* - GENERAL_FAILURE if there is an unspecified error
|
* - INVALID_ARGUMENT if the input model is invalid
|
* @param preparedModel Returned model that has been prepared for execution,
|
* nullptr if the model was unable to be prepared.
|
*/
|
Return<void> notify_1_2(ErrorStatus status,
|
const sp<V1_2::IPreparedModel>& preparedModel) override;
|
|
/**
|
* PreparedModelCallback::wait blocks until notify* has been called on the
|
* callback object.
|
*/
|
void wait() const;
|
|
/**
|
* Retrieves the error status returned from the asynchronous task launched
|
* by IDevice::prepareModel*. If IDevice::prepareModel* has not finished
|
* asynchronously preparing the model, this call will block until the
|
* asynchronous task notifies the object.
|
*
|
* @return status Error status returned from asynchronously preparing the
|
* model; will be:
|
* - NONE if the asynchronous preparation was successful
|
* - DEVICE_UNAVAILABLE if driver is offline or busy
|
* - GENERAL_FAILURE if there is an unspecified error
|
* - INVALID_ARGUMENT if the input model is invalid
|
*/
|
ErrorStatus getStatus() const;
|
|
/**
|
* Retrieves the model that has been prepared for execution from the
|
* asynchronous task launched by IDevice::prepareModel*. If
|
* IDevice::prepareModel* has not finished asynchronously preparing the
|
* model, this call will block until the asynchronous task notifies the
|
* object.
|
*
|
* @return preparedModel Returned model that has been prepared for
|
* execution, nullptr if the model was unable to be prepared.
|
*/
|
sp<V1_0::IPreparedModel> getPreparedModel() const;
|
|
private:
|
mutable std::mutex mMutex;
|
mutable std::condition_variable mCondition;
|
bool mNotified GUARDED_BY(mMutex) = false;
|
ErrorStatus mErrorStatus = ErrorStatus::GENERAL_FAILURE;
|
sp<V1_0::IPreparedModel> mPreparedModel;
|
};
|
|
/**
|
* The ExecutionCallback class is used to receive the results of the execution
|
* from a task executing asynchronously with respect to the runtime. If a
|
* calling thread calls wait or get* on a ExecutionCallback object and the
|
* corresponding asynchronous task has not finished the execution, the calling
|
* thread will block until the asynchronous task has either called notify or
|
* notify_1_2.
|
*
|
* If the callback object is notified more than once, only the results of the
|
* first call to notify* are used, and the results from subsequent calls are
|
* discarded.
|
*
|
* This callback object is passed as an argument to IPreparedModel::execute*.
|
*/
|
class ExecutionCallback : public IExecutionCallback {
|
using ExecutionFinish =
|
std::function<ErrorStatus(ErrorStatus, const std::vector<OutputShape>&)>;
|
|
public:
|
/**
|
* IExecutionCallback::notify marks the callback object with the return
|
* status of the asynchronous execution that held this callback and enables
|
* all prior and future wait calls on the ExecutionCallback object to
|
* proceed.
|
*
|
* Either IExecutionCallback::notify or IExecutionCallback::notify_1_2 must
|
* be called on a given ExecutionCallback object.
|
*
|
* If the callback object is notified more than once, only the results of
|
* the first call to notify* are used, and the results from subsequent calls
|
* are discarded.
|
*
|
* @param status Error status returned from launching the asynchronous task
|
* (if the launch fails) or from the asynchronous task itself (if the
|
* launch succeeds). Must be:
|
* - NONE if the asynchronous execution was successful
|
* - DEVICE_UNAVAILABLE if driver is offline or busy
|
* - GENERAL_FAILURE if there is an unspecified error
|
* - OUTPUT_INSUFFICIENT_SIZE if provided output buffer is not large
|
* enough to store the resultant values
|
* - INVALID_ARGUMENT if the input request is invalid
|
*/
|
Return<void> notify(ErrorStatus status) override;
|
|
/**
|
* IExecutionCallback::notify_1_2 marks the callback object with the results
|
* (error status, dynamic output shapes, and timing information) of the
|
* asynchronous execution that held this callback and enables all prior and
|
* future wait calls on the ExecutionCallback object to proceed.
|
*
|
* Either IExecutionCallback::notify or IExecutionCallback::notify_1_2 must
|
* be called on a given ExecutionCallback object.
|
*
|
* If the callback object is notified more than once, only the results of
|
* the first call to notify* are used, and the results from subsequent calls
|
* are discarded.
|
*
|
* @param status Error status returned from launching the asynchronous task
|
* (if the launch fails) or from the asynchronous task itself (if the
|
* launch succeeds). Must be:
|
* - NONE if the asynchronous execution was successful
|
* - DEVICE_UNAVAILABLE if driver is offline or busy
|
* - GENERAL_FAILURE if the asynchronous task resulted in an unspecified
|
* error
|
* - OUTPUT_INSUFFICIENT_SIZE if at least one output operand buffer is
|
* not large enough to store the corresponding output
|
* - INVALID_ARGUMENT if one of the input arguments to prepareModel is
|
* invalid
|
* @param outputShapes A list of shape information of model output operands.
|
* The index into "outputShapes" corresponds to the index of the output
|
* operand in the Request outputs vector. outputShapes must be empty
|
* unless the status is either NONE or OUTPUT_INSUFFICIENT_SIZE.
|
* @param Timing Duration of execution. Unless MeasureTiming::YES was passed
|
* when launching the execution and status is NONE, all times must be
|
* reported as UINT64_MAX. A driver may choose to report any time as
|
* UINT64_MAX, indicating that particular measurement is not available.
|
*/
|
Return<void> notify_1_2(ErrorStatus status, const hidl_vec<OutputShape>& outputShapes,
|
const Timing& timing) override;
|
|
// An overload of the latest notify interface to hide the version from ExecutionBuilder.
|
Return<void> notify(ErrorStatus status, const hidl_vec<OutputShape>& outputShapes,
|
const Timing& timing) {
|
return notify_1_2(status, outputShapes, timing);
|
}
|
|
/**
|
* ExecutionCallback::wait blocks until notify* has been called on the
|
* callback object.
|
*/
|
void wait() const;
|
|
/**
|
* Retrieves the error status returned from the asynchronous task launched
|
* by either IPreparedModel::execute or IPreparedModel::execute_1_2. If
|
* IPreparedModel::execute or IPreparedModel::execute_1_2 has not finished
|
* asynchronously executing, this call will block until the asynchronous
|
* task notifies the object.
|
*
|
* @return status Error status returned from launching the asynchronous task
|
* (if the launch fails) or from the asynchronous task itself (if the
|
* launch succeeds). Must be:
|
* - NONE if the asynchronous execution was successful
|
* - DEVICE_UNAVAILABLE if driver is offline or busy
|
* - GENERAL_FAILURE if the asynchronous task resulted in an unspecified
|
* error
|
* - OUTPUT_INSUFFICIENT_SIZE if at least one output operand buffer is
|
* not large enough to store the corresponding output
|
* - INVALID_ARGUMENT if one of the input arguments to prepareModel is
|
* invalid
|
*/
|
ErrorStatus getStatus() const;
|
|
/**
|
* Retrieves the output shapes returned from the asynchronous task launched
|
* by IPreparedModel::execute_1_2. If IPreparedModel::execute_1_2 has not
|
* finished asynchronously executing, this call will block until the
|
* asynchronous task notifies the object.
|
*
|
* If the asynchronous task was launched by IPreparedModel::execute, an
|
* empty vector will be returned.
|
*
|
* @return outputShapes A list of shape information of model output
|
* operands. The index into "outputShapes" corresponds to the index of
|
* the output operand in the Request outputs vector. outputShapes must
|
* be empty unless the status is either NONE or
|
* OUTPUT_INSUFFICIENT_SIZE. outputShaps may be empty if the status is
|
* NONE and all model output operands are fully-specified at execution
|
* time. outputShapes must have the same number of elements as the
|
* number of model output operands if the status is
|
* OUTPUT_INSUFFICIENT_SIZE, or if the status is NONE and the model has
|
* at least one output operand that is not fully-specified.
|
*/
|
const std::vector<OutputShape>& getOutputShapes() const;
|
|
/**
|
* Retrieves the duration of execution of the asynchronous task launched by
|
* IPreparedModel::execute_1_2. If IPreparedModel::execute_1_2 has not
|
* finished asynchronously executing, this call will block until the
|
* asynchronous task notifies the object.
|
*
|
* If the asynchronous task was launched by IPreparedModel::execute, every
|
* time must be UINT64_MAX.
|
*
|
* @return timing Duration of the execution. Every time must be UINT64_MAX
|
* unless the status is NONE.
|
*/
|
Timing getTiming() const;
|
|
/**
|
* ExecutionCallback::bindThread binds a thread to the ExecutionCallback
|
* object. The bound thread is later joined by ExecutionCallback::wait or
|
* ExecutionCallback::get*.
|
*
|
* Once a thread is bound with ExecutionCallback::bindThread, the client
|
* code must ensure that ExecutionCallback::wait or ExecutionCallback::get*
|
* has been called before the ExecutionCallback object is destroyed.
|
*
|
* The bound thread must not call any ExecutionCallback method with the
|
* exception of ExecutionCallback::notify*, which it must call when the
|
* thread has finished its computation.
|
*
|
* ExecutionCallback::bindThread can be called at most once on a given
|
* callback object.
|
*
|
* @param asyncThread Thread to be bound to the callback object. The thread
|
* object must represent a thread of execution -- i.e.,
|
* std::thread::joinable() must be true.
|
* @return bool True if successful, false if thread was not properly bound.
|
*/
|
bool bindThread(std::thread asyncThread);
|
|
/**
|
* ExecutionCallback::setOnFinish binds a callback to the ExecutionCallback
|
* object that will be executed during one of the ExecutionCallback::notify*
|
* calls but before any calls to wait or get* return. This provided callback
|
* is provided with both the ErrorStatus and the output shapes from
|
* ExecutionCallback::notify*.
|
*
|
* The bound function must not synchronize with or otherwise access the
|
* callback object it is bound to, as this could cause a deadlock.
|
*
|
* This call will not bind the provided callback if any of the following
|
* occur:
|
* (1) the provided callback is invalid (i.e., "(bool) finish" is false)
|
* (2) ExecutionCallback already contains a bound callback
|
* (3) ExecutionCallback has already been notified with results
|
*
|
* @param finish Callback to be executed when ExecutionCallback is notified
|
* with results.
|
*/
|
void setOnFinish(const ExecutionFinish& finish);
|
|
private:
|
/*
|
* ExecutionCallback::notifyInternal stores the results of the execution
|
* (status, output shapes, and timing information) in the ExecutionCallback
|
* object and invokes the bound callback function "mOnFinish" (if present)
|
* before any call to wait or get* return. It then enables all prior and
|
* future wait calls on the ExecutionCallback object to proceed.
|
*/
|
void notifyInternal(ErrorStatus errorStatus, const hidl_vec<OutputShape>& outputShapes,
|
const Timing& timing);
|
|
// members
|
mutable std::mutex mMutex;
|
mutable std::condition_variable mCondition;
|
mutable std::thread mThread GUARDED_BY(mMutex);
|
ExecutionFinish mOnFinish GUARDED_BY(mMutex);
|
bool mNotified GUARDED_BY(mMutex) = false;
|
ErrorStatus mErrorStatus = ErrorStatus::GENERAL_FAILURE;
|
std::vector<OutputShape> mOutputShapes = {};
|
Timing mTiming = {};
|
};
|
|
} // namespace android::hardware::neuralnetworks::V1_2::implementation
|
|
namespace android::nn {
|
|
using ::android::hardware::neuralnetworks::V1_2::implementation::ExecutionCallback;
|
using ::android::hardware::neuralnetworks::V1_2::implementation::PreparedModelCallback;
|
|
} // namespace android::nn
|
|
#endif // ANDROID_ML_NN_RUNTIME_CALLBACKS_H
|