1 /* 2 * Copyright (C) 2017 The Android Open Source Project 3 * 4 * Licensed under the Apache License, Version 2.0 (the "License"); 5 * you may not use this file except in compliance with the License. 6 * You may obtain a copy of the License at 7 * 8 * http://www.apache.org/licenses/LICENSE-2.0 9 * 10 * Unless required by applicable law or agreed to in writing, software 11 * distributed under the License is distributed on an "AS IS" BASIS, 12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13 * See the License for the specific language governing permissions and 14 * limitations under the License. 15 */ 16 17 #ifndef ANDROID_PACKAGES_MODULES_NEURALNETWORKS_RUNTIME_EXECUTION_CALLBACK_H 18 #define ANDROID_PACKAGES_MODULES_NEURALNETWORKS_RUNTIME_EXECUTION_CALLBACK_H 19 20 #include <android-base/thread_annotations.h> 21 #include <nnapi/Types.h> 22 23 #include <condition_variable> 24 #include <functional> 25 #include <mutex> 26 #include <thread> 27 #include <vector> 28 29 namespace android::nn { 30 31 // This class used to be a HIDL callback class to receive the results of 32 // IDevice::execute* asynchronously. It's not used for this anymore. 33 // 34 // TODO(b/122316159): Replace ExecutionCallback and CallbackEvent with a new 35 // class like AsyncTaskEvent. 36 /** 37 * The ExecutionCallback class is used to receive the results of the execution 38 * from a task executing asynchronously with respect to the runtime. If a 39 * calling thread calls wait or get* on a ExecutionCallback object and the 40 * corresponding asynchronous task has not finished the execution, the calling 41 * thread will block until the asynchronous task has called one of the notify* 42 * methods. 43 * 44 * If the callback object is notified more than once, only the results of the 45 * first call to notify* are used, and the results from subsequent calls are 46 * discarded. 47 */ 48 class ExecutionCallback { 49 using ExecutionFinish = 50 std::function<ErrorStatus(ErrorStatus, const std::vector<OutputShape>&)>; 51 52 public: 53 /** 54 * ExecutionCallback::notify marks the callback object with the results 55 * (error status, dynamic output shapes, and timing information) of the 56 * asynchronous execution that held this callback and enables all prior and 57 * future wait calls on the ExecutionCallback object to proceed. 58 * 59 * If the callback object is notified more than once, only the results of 60 * the first call to notify* are used, and the results from subsequent calls 61 * are discarded. 62 * 63 * @param status Error status returned from launching the asynchronous task 64 * (if the launch fails) or from the asynchronous task itself (if the 65 * launch succeeds). Must be: 66 * - NONE if the asynchronous execution was successful 67 * - DEVICE_UNAVAILABLE if driver is offline or busy 68 * - GENERAL_FAILURE if the asynchronous task resulted in an unspecified 69 * error 70 * - OUTPUT_INSUFFICIENT_SIZE if at least one output operand buffer is 71 * not large enough to store the corresponding output 72 * - INVALID_ARGUMENT if one of the input arguments to prepareModel is 73 * invalid 74 * - MISSED_DEADLINE_* if the deadline could not be met 75 * - RESOURCE_EXHAUSTED_* if the execution was aborted by the driver 76 * @param outputShapes A list of shape information of model output operands. 77 * The index into "outputShapes" corresponds to the index of the output 78 * operand in the Request outputs vector. outputShapes must be empty 79 * unless the status is either NONE or OUTPUT_INSUFFICIENT_SIZE. 80 * @param Timing Duration of execution. Unless MeasureTiming::YES was passed 81 * when launching the execution and status is NONE, all times must be 82 * reported as UINT64_MAX. A driver may choose to report any time as 83 * UINT64_MAX, indicating that particular measurement is not available. 84 */ 85 void notify(ErrorStatus status, const std::vector<OutputShape>& outputShapes, 86 const Timing& timing); 87 88 /** 89 * ExecutionCallback::wait blocks until notify* has been called on the 90 * callback object. 91 */ 92 void wait() const; 93 94 /** 95 * Retrieves the error status returned from the asynchronous task launched 96 * by IPreparedModel::execute* (but not by 97 * IPreparedModel::executeSynchronously*). If IPreparedModel::execute* has 98 * not finished asynchronously executing, this call will block until the 99 * asynchronous task notifies the object. 100 * 101 * @return status Error status returned from launching the asynchronous task 102 * (if the launch fails) or from the asynchronous task itself (if the 103 * launch succeeds). Must be: 104 * - NONE if the asynchronous execution was successful 105 * - DEVICE_UNAVAILABLE if driver is offline or busy 106 * - GENERAL_FAILURE if the asynchronous task resulted in an unspecified 107 * error 108 * - OUTPUT_INSUFFICIENT_SIZE if at least one output operand buffer is 109 * not large enough to store the corresponding output 110 * - INVALID_ARGUMENT if one of the input arguments to prepareModel is 111 * invalid 112 * - MISSED_DEADLINE_* if the deadline could not be met 113 * - RESOURCE_EXHAUSTED_* if the task was aborted by the driver 114 * - DEAD_OBJECT if the driver crashed without returning a result 115 */ 116 ErrorStatus getStatus() const; 117 118 /** 119 * Retrieves the output shapes returned from the asynchronous task launched 120 * by either IPreparedModel::execute_1_2 or IPreparedModel::execute_1_3. If 121 * IPreparedModel::execute_1_2 or IPreparedModel::execute_1_3 has not 122 * finished asynchronously executing, this call will block until the 123 * asynchronous task notifies the object. 124 * 125 * If the asynchronous task was launched by IPreparedModel::execute, an 126 * empty vector will be returned. 127 * 128 * @return outputShapes A list of shape information of model output 129 * operands. The index into "outputShapes" corresponds to the index of 130 * the output operand in the Request outputs vector. outputShapes must 131 * be empty unless the status is either NONE or 132 * OUTPUT_INSUFFICIENT_SIZE. outputShaps may be empty if the status is 133 * NONE and all model output operands are fully-specified at execution 134 * time. outputShapes must have the same number of elements as the 135 * number of model output operands if the status is 136 * OUTPUT_INSUFFICIENT_SIZE, or if the status is NONE and the model has 137 * at least one output operand that is not fully-specified. 138 */ 139 const std::vector<OutputShape>& getOutputShapes() const; 140 141 /** 142 * Retrieves the duration of execution of the asynchronous task launched by 143 * by either IPreparedModel::execute_1_2 or IPreparedModel::execute_1_3. If 144 * IPreparedModel::execute_1_2 or IPreparedModel::execute_1_3 has not 145 * finished asynchronously executing, this call will block until the 146 * asynchronous task notifies the object. 147 * 148 * If the asynchronous task was launched by IPreparedModel::execute, every 149 * time must be UINT64_MAX. 150 * 151 * @return timing Duration of the execution. Every time must be UINT64_MAX 152 * unless the status is NONE. 153 */ 154 Timing getTiming() const; 155 156 /** 157 * ExecutionCallback::bindThread binds a thread to the ExecutionCallback 158 * object. The bound thread is later joined by ExecutionCallback::wait or 159 * ExecutionCallback::get*. 160 * 161 * Once a thread is bound with ExecutionCallback::bindThread, the client 162 * code must ensure that ExecutionCallback::wait or ExecutionCallback::get* 163 * has been called before the ExecutionCallback object is destroyed. 164 * 165 * The bound thread must not call any ExecutionCallback method with the 166 * exception of ExecutionCallback::notify*, which it must call when the 167 * thread has finished its computation. 168 * 169 * ExecutionCallback::bindThread can be called at most once on a given 170 * callback object. 171 * 172 * @param asyncThread Thread to be bound to the callback object. The thread 173 * object must represent a thread of execution -- i.e., 174 * std::thread::joinable() must be true. 175 * @return bool True if successful, false if thread was not properly bound. 176 */ 177 bool bindThread(std::thread asyncThread); 178 179 /** 180 * ExecutionCallback::setOnFinish binds a callback to the ExecutionCallback 181 * object that will be executed during one of the ExecutionCallback::notify* 182 * calls but before any calls to wait or get* return. This provided callback 183 * is provided with both the ErrorStatus and the output shapes from 184 * ExecutionCallback::notify*. 185 * 186 * The bound function must not synchronize with or otherwise access the 187 * callback object it is bound to, as this could cause a deadlock. 188 * 189 * This call will not bind the provided callback if any of the following 190 * occur: 191 * (1) the provided callback is invalid (i.e., "(bool) finish" is false) 192 * (2) ExecutionCallback already contains a bound callback 193 * (3) ExecutionCallback has already been notified with results 194 * 195 * @param finish Callback to be executed when ExecutionCallback is notified 196 * with results. 197 */ 198 void setOnFinish(const ExecutionFinish& finish); 199 200 private: 201 /* 202 * ExecutionCallback::notifyInternal stores the results of the execution 203 * (status, output shapes, and timing information) in the ExecutionCallback 204 * object and invokes the bound callback function "mOnFinish" (if present) 205 * before any call to wait or get* return. It then enables all prior and 206 * future wait calls on the ExecutionCallback object to proceed. 207 */ 208 void notifyInternal(ErrorStatus errorStatus, std::vector<OutputShape> outputShapes, 209 Timing timing); 210 211 // members 212 mutable std::mutex mMutex; 213 mutable std::condition_variable mCondition; 214 mutable std::thread mThread GUARDED_BY(mMutex); 215 ExecutionFinish mOnFinish GUARDED_BY(mMutex); 216 bool mNotified GUARDED_BY(mMutex) = false; 217 ErrorStatus mErrorStatus = ErrorStatus::GENERAL_FAILURE; 218 std::vector<OutputShape> mOutputShapes; 219 Timing mTiming = {}; 220 }; 221 222 } // namespace android::nn 223 224 #endif // ANDROID_PACKAGES_MODULES_NEURALNETWORKS_RUNTIME_EXECUTION_CALLBACK_H 225