| /* |
| * Copyright (C) 2020 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| #ifndef ANDROID_FRAMEWORKS_ML_NN_COMMON_NNAPI_IPREPARED_MODEL_H |
| #define ANDROID_FRAMEWORKS_ML_NN_COMMON_NNAPI_IPREPARED_MODEL_H |
| |
| #include <any> |
| #include <functional> |
| #include <memory> |
| #include <utility> |
| #include <vector> |
| |
| #include "nnapi/Types.h" |
| |
| namespace android::nn { |
| |
| // Callback type handed back by IPreparedModel::executeFenced so that the caller can query the |
| // outcome of a fenced execution. Invoking it returns the status (carried by the GeneralResult) |
| // together with a pair of Timing values: timingLaunched first, timingFenced second. |
| using ExecuteFencedInfoCallback = std::function<GeneralResult<std::pair<Timing, Timing>>()>; |
| |
| /** |
| * IPreparedModel describes a model that has been prepared for execution and is used to launch |
| * executions. |
| * |
| * This interface is thread-safe, and any class that implements this interface must be thread-safe. |
| */ |
| class IPreparedModel { |
| public: |
| /** |
| * Performs a synchronous execution on a prepared model. |
| * |
| * The execution is performed synchronously with respect to the caller. IPreparedModel::execute |
| * must verify the inputs to the function are correct. If there is an error, |
| * IPreparedModel::execute must immediately return {@link ErrorStatus::INVALID_ARGUMENT} as an |
| * ExecutionError. If the inputs to the function are valid and there is no error, |
| * IPreparedModel::execute must perform the execution, and must not return until the execution |
| * is complete. |
| * |
| * The caller must not change the content of any data object referenced by request (described by |
| * the {@link DataLocation} of a {@link Request::Argument}) until IPreparedModel::execute returns. |
| * IPreparedModel::execute must not change the content of any of the data objects corresponding |
| * to request inputs. |
| * |
| * If the prepared model was prepared from a model wherein all tensor operands have fully |
| * specified dimensions, and the inputs to the function are valid, and at execution time every |
| * operation's input operands have legal values, then the execution should complete |
| * successfully. There must be no failure unless the device itself is in a bad state. |
| * |
| * IPreparedModel::execute may be called with an optional deadline. If the execution is not |
| * able to be completed before the provided deadline, the execution may be aborted, and either |
| * {@link ErrorStatus::MISSED_DEADLINE_TRANSIENT} or {@link |
| * ErrorStatus::MISSED_DEADLINE_PERSISTENT} may be returned as an ExecutionError. |
| * |
| * @param request The input and output information on which the prepared model is to be |
| * executed. |
| * @param measure Specifies whether or not to measure duration of the execution. |
| * @param deadline Optional time point. If provided, execute is expected to complete by this |
| * time point. If it is not able to be completed by the deadline, the execution may be |
| * aborted. |
| * @param loopTimeoutDuration The maximum amount of time that should be spent executing a {@link |
| * OperationType::WHILE} operation. If a loop condition model does not output `false` within |
| * this duration, the execution must be aborted. If no loop timeout duration is provided, |
| * the maximum amount of time is {@link LoopTimeoutDurationNs::DEFAULT}. When provided, the |
| * duration must not exceed {@link LoopTimeoutDurationNs::MAXIMUM}. |
| * @return A pair consisting of: |
| * - A list of shape information of model output operands. The index into "outputShapes" |
| * corresponds to the index of the output operand in the Request outputs vector. |
| * outputShapes must be empty unless the execution is successful or the ExecutionResult is |
| * {@link ErrorStatus::OUTPUT_INSUFFICIENT_SIZE}. outputShapes may be empty if the |
| * execution is successful and all model output operands are fully-specified at execution |
| * time. outputShapes must have the same number of elements as the number of model output |
| * operands if the ExecutionResult is {@link ErrorStatus::OUTPUT_INSUFFICIENT_SIZE}, or if |
| * the execution is successful and the model has at least one output operand that is not |
| * fully-specified. |
| * - Duration of execution. Unless measure is YES and the execution is successful, all times |
| * must be reported as UINT64_MAX. A driver may choose to report any time as UINT64_MAX, |
| * indicating that measurement is not available. |
| */ |
| virtual ExecutionResult<std::pair<std::vector<OutputShape>, Timing>> execute( |
| const Request& request, MeasureTiming measure, const OptionalTimePoint& deadline, |
| const OptionalTimeoutDuration& loopTimeoutDuration) const = 0; |
| |
| /** |
| * Launch a fenced asynchronous execution on a prepared model. |
| * |
| * The execution is performed asynchronously with respect to the caller. |
| * IPreparedModel::executeFenced must verify its inputs are correct, and the usages of memory |
| * pools allocated by IDevice::allocate are valid. If there is an error, |
| * IPreparedModel::executeFenced must immediately return {@link ErrorStatus::INVALID_ARGUMENT} |
| * as a GeneralError. If the inputs to the function are valid and there is no error, |
| * IPreparedModel::executeFenced must dispatch an asynchronous task to perform the execution in |
| * the background, and immediately return with a sync fence that will be signaled once the |
| * execution is completed and a callback that can be used by the client to query the duration |
| * and runtime error status. If the task has finished before the call returns, an empty handle |
| * may be returned for syncFence. The execution must wait for all the sync fences (if any) in |
| * waitFor to be signaled before starting the actual execution. |
| * |
| * When the asynchronous task has finished its execution, it must immediately signal the |
| * syncFence returned from the IPreparedModel::executeFenced call. After the syncFence is |
| * signaled, the task must not modify the content of any data object referenced by request |
| * (described by the {@link DataLocation} of a {@link Request::Argument}). |
| * |
| * IPreparedModel::executeFenced may be called with an optional deadline and an optional |
| * timeout duration (timeoutDurationAfterFence). If the execution is not able to be completed |
| * before the provided deadline or within the timeout duration (measured from when all sync |
| * fences in waitFor are signaled), whichever comes earlier, the execution may be aborted, and |
| * either {@link ErrorStatus::MISSED_DEADLINE_TRANSIENT} or {@link |
| * ErrorStatus::MISSED_DEADLINE_PERSISTENT} may be returned as a GeneralError. The error due to |
| * an abort must be sent the same way as other errors, described above. |
| * |
| * If any of the sync fences in waitFor changes to error status after the |
| * IPreparedModel::executeFenced call succeeds, or the execution is aborted because it cannot |
| * finish before the deadline has been reached or the duration has elapsed, the driver must |
| * immediately set the returned syncFence to error status. |
| * |
| * @param request The input and output information on which the prepared model is to be |
| * executed. |
| * @param waitFor A vector of sync fence file descriptors. The execution must wait for all sync |
| * fences to be signaled before starting the task. |
| * @param measure Specifies whether or not to measure duration of the execution. |
| * @param deadline The time by which execution is expected to complete. If the execution cannot |
| * be finished by the deadline, the execution may be aborted. |
| * @param loopTimeoutDuration The maximum amount of time that should be spent executing a {@link |
| * OperationType::WHILE} operation. If a loop condition model does not output `false` within |
| * this duration, the execution must be aborted. If no loop timeout duration is provided, |
| * the maximum amount of time is {@link LoopTimeoutDurationNs::DEFAULT}. When provided, the |
| * duration must not exceed {@link LoopTimeoutDurationNs::MAXIMUM}. |
| * @param timeoutDurationAfterFence The timeout duration within which the execution is expected |
| * to complete after all sync fences in waitFor are signaled. |
| * @return A pair consisting of: |
| * - A syncFence that will be triggered when the task is completed. The syncFence will be |
| * set to error if a critical error occurs when doing actual evaluation. |
| * - A callback that can be used to query information like duration and detailed runtime |
| * error status when the task is completed. |
| */ |
| virtual GeneralResult<std::pair<SyncFence, ExecuteFencedInfoCallback>> executeFenced( |
| const Request& request, const std::vector<SyncFence>& waitFor, MeasureTiming measure, |
| const OptionalTimePoint& deadline, const OptionalTimeoutDuration& loopTimeoutDuration, |
| const OptionalTimeoutDuration& timeoutDurationAfterFence) const = 0; |
| |
| /** |
| * Return the resource that the IPreparedModel wraps, or an empty std::any. |
| * |
| * This method is used for IDevice::allocate. |
| * |
| * @return std::any containing the underlying resource. |
| */ |
| virtual std::any getUnderlyingResource() const = 0; |
| |
| // Public virtual destructor to allow objects to be stored (and destroyed) as smart pointers. |
| // E.g., std::unique_ptr<IPreparedModel>. |
| virtual ~IPreparedModel() = default; |
| |
| protected: |
| // Protect the non-destructor special member functions to prevent object slicing: with the |
| // constructors and assignment operators protected, only derived classes can invoke them, so an |
| // implementation cannot be copied or moved through the IPreparedModel interface type itself. |
| IPreparedModel() = default; |
| IPreparedModel(const IPreparedModel&) = default; |
| IPreparedModel(IPreparedModel&&) noexcept = default; |
| IPreparedModel& operator=(const IPreparedModel&) = default; |
| IPreparedModel& operator=(IPreparedModel&&) noexcept = default; |
| }; |
| |
| } // namespace android::nn |
| |
| #endif // ANDROID_FRAMEWORKS_ML_NN_COMMON_NNAPI_IPREPARED_MODEL_H |