1 /* 2 * Copyright (C) 2018 The Android Open Source Project 3 * 4 * Licensed under the Apache License, Version 2.0 (the "License"); 5 * you may not use this file except in compliance with the License. 6 * You may obtain a copy of the License at 7 * 8 * http://www.apache.org/licenses/LICENSE-2.0 9 * 10 * Unless required by applicable law or agreed to in writing, software 11 * distributed under the License is distributed on an "AS IS" BASIS, 12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13 * See the License for the specific language governing permissions and 14 * limitations under the License. 15 */ 16 17 #ifndef ANDROID_PACKAGES_MODULES_NEURALNETWORKS_COMMON_TYPES_TRACING_H 18 #define ANDROID_PACKAGES_MODULES_NEURALNETWORKS_COMMON_TYPES_TRACING_H 19 20 #ifndef NN_COMPATIBILITY_LIBRARY_BUILD 21 #define ATRACE_TAG ATRACE_TAG_NNAPI 22 #include <utils/Trace.h> 23 #endif // NN_COMPATIBILITY_LIBRARY_BUILD 24 25 // Neural Networks API (NNAPI) systracing 26 // 27 // Primary goal of the tracing is to capture and present timings for NNAPI. 28 // (Other uses include providing visibility to split of execution between 29 // drivers and the CPU fallback, and the ability to visualize call sequences). 30 // 31 // The tracing has three parts: 32 // 1 Trace macros defined in this file and used throughout the codebase, 33 // modelled after and using atrace. These implement a naming convention for 34 // the tracepoints, interpreted by the systrace parser. 35 // 2 Android systrace (atrace) on-device capture and host-based analysis. 36 // 3 A systrace parser (TODO) to summarize the timings. 37 // 38 // For an overview and introduction, please refer to the "NNAPI Systrace design 39 // and HOWTO" (internal Docs for now). This header doesn't try to replicate all 40 // the information in that document. For the contract between traces in code and 41 // the statistics created by the systrace parser, see 42 // tools/systrace-parser/contract-between-code-and-parser.txt. 43 // 44 // Glossary: 45 // - Phase: stage in processing (e.g., Preparation, Compilation, Execution); 46 // Overall phase nests rest, Execution nests Input/Output, Transformation, 47 // Computation and Results; optionally Executions can be nested in a 48 // Warmup and Benchmark - otherwise not nested (Initialization phase 49 // functions may occur inside other phases but will be counted out during 50 // analysis). Nested phases (other than Initialization) are analysed as a 51 // breakdown of the parent phase. 52 // - Layer: component in the stack (from top to bottom: App, Runtime, IPC, 53 // Driver/CPU). Calls to lower layers are typically nested within calls to upper 54 // layers. 55 // - Bucket: unit of timing analysis, the combination of Phase and Layer (and 56 // thus also typically nested). 57 // - Detail: specific unit being executed, typically a function. 58 59 // Convenience macros to be used in the code (phases defined below). 60 // (Macros so that string concatenation is done at compile time). 61 // 62 // These exist in three variants: 63 // - Simple (NNTRACE_<layer and potentially phase>) - to be used when only one 64 // Phase is active within a scope 65 // - "Switch" (NNTRACE_<...>_SWITCH) - to be used when multiple Phases 66 // share a scope (e.g., transformation of data and computation in same 67 // function). 68 // - "Subtract" (NNTRACE_<...>_SUBTRACT) - to be used when nesting is violated 69 // and the time should be subtracted from the parent scope 70 // Arguments: 71 // - phase: one of the NNTRACE_PHASE_* macros defined below. 72 // - detail: free-form string constant, typically function name. 73 // Example usage: 74 // // Simple 75 // int ANeuralNetworksMemory_createFromFd(...) { 76 // NNTRACE_RT(NNTRACE_PHASE_PREPARATION, "ANeuralNetworksMemory_createFromFd"); 77 // } 78 // // Switch 79 // bool concatenationFloat32(...) { 80 // NNTRACE_TRANS("concatenationFloat32"); // Transformation of data begins 81 // ... 82 // NNTRACE_COMP_SWITCH("optimized_ops::Concatenation"); // Transformation 83 // // ends and computation 84 // // begins 85 // } 86 // // Subtract 87 // static int compile(...) { 88 // NNTRACE_FULL(NNTRACE_LAYER_IPC, NNTRACE_PHASE_COMPILATION, "prepareModel"); 89 // device->getInterface()->prepareModel(..., preparedModelCallback); 90 // preparedModelCallback->wait() 91 // } 92 // ErrorStatus VersionedIDevice::prepareModel(...) { 93 // ... IPC work ... 94 // { 95 // NNTRACE_FULL_SUBTRACT(NNTRACE_LAYER_RUNTIME, NNTRACE_PHASE_COMPILATION, 96 // "VersionedIDevice::prepareModel"); 97 // ... Runtime work ... 98 // } 99 // ... IPC work ... 100 // } 101 // 102 // Layer Application - For native applications (e.g., unit tests) 103 #define NNTRACE_APP(phase, detail) NNTRACE_FULL(NNTRACE_LAYER_APPLICATION, phase, detail) 104 #define NNTRACE_APP_SWITCH(phase, detail) \ 105 NNTRACE_FULL_SWITCH(NNTRACE_LAYER_APPLICATION, phase, detail) 106 // Layer Runtime - For the NNAPI runtime 107 #define NNTRACE_RT(phase, detail) NNTRACE_FULL(NNTRACE_LAYER_RUNTIME, phase, detail) 108 #define NNTRACE_RT_SWITCH(phase, detail) NNTRACE_FULL_SWITCH(NNTRACE_LAYER_RUNTIME, phase, detail) 109 // Layer CPU - CPU executor 110 #define NNTRACE_CPU(phase, detail) NNTRACE_FULL(NNTRACE_LAYER_CPU, phase, detail) 111 #define NNTRACE_COMP(detail) NNTRACE_FULL(NNTRACE_LAYER_CPU, NNTRACE_PHASE_COMPUTATION, detail) 112 #define NNTRACE_COMP_SWITCH(detail) \ 113 NNTRACE_FULL_SWITCH(NNTRACE_LAYER_CPU, NNTRACE_PHASE_COMPUTATION, detail) 114 #define NNTRACE_TRANS(detail) NNTRACE_FULL(NNTRACE_LAYER_CPU, NNTRACE_PHASE_TRANSFORMATION, detail) 115 116 // Fully specified macros to be used when no convenience wrapper exists for your 117 // need. 118 #define NNTRACE_FULL(layer, phase, detail) NNTRACE_NAME_1(("[NN_" layer "_" phase "]" detail)) 119 #define NNTRACE_FULL_SWITCH(layer, phase, detail) \ 120 NNTRACE_NAME_SWITCH(("[SW][NN_" layer "_" phase "]" detail)) 121 #define NNTRACE_FULL_SUBTRACT(layer, phase, detail) \ 122 NNTRACE_NAME_1(("[SUB][NN_" layer "_" phase "]" detail)) 123 // Raw macro without scoping requirements, for special cases 124 #define NNTRACE_FULL_RAW(layer, phase, detail) \ 125 android::ScopedTrace PASTE(___tracer, __LINE__)(ATRACE_TAG, ("[NN_" layer "_" phase "]" detail)) 126 127 // Tracing buckets - for calculating timing summaries over. 128 // 129 // Application-only phases 130 #define NNTRACE_PHASE_OVERALL "PO" // Overall program, e.g., one benchmark case 131 #define NNTRACE_PHASE_WARMUP "PWU" // Warmup (nesting multiple executions) 132 #define NNTRACE_PHASE_BENCHMARK "PBM" // Benchmark (nesting multiple executions) 133 // Main phases, usable by all layers 134 #define NNTRACE_PHASE_INITIALIZATION "PI" // Initialization - not related to a model 135 #define NNTRACE_PHASE_PREPARATION "PP" // Model construction 136 #define NNTRACE_PHASE_COMPILATION "PC" // Model compilation 137 #define NNTRACE_PHASE_EXECUTION "PE" // Executing the model 138 #define NNTRACE_PHASE_TERMINATION "PT" // Tearing down 139 #define NNTRACE_PHASE_UNSPECIFIED "PU" // Helper code called from multiple phases 140 // Subphases of execution 141 #define NNTRACE_PHASE_INPUTS_AND_OUTPUTS "PIO" // Setting inputs/outputs and allocating buffers 142 #define NNTRACE_PHASE_TRANSFORMATION "PTR" // Transforming data for computation 143 #define NNTRACE_PHASE_COMPUTATION "PCO" // Computing operations' outputs 144 #define NNTRACE_PHASE_RESULTS "PR" // Reading out results 145 // Layers 146 #define NNTRACE_LAYER_APPLICATION "LA" 147 #define NNTRACE_LAYER_RUNTIME "LR" 148 #define NNTRACE_LAYER_IPC "LI" 149 #define NNTRACE_LAYER_DRIVER "LD" 150 #define NNTRACE_LAYER_CPU "LC" 151 #define NNTRACE_LAYER_OTHER "LO" 152 #define NNTRACE_LAYER_UTILITY "LU" // Code used from multiple layers 153 154 #ifndef NN_COMPATIBILITY_LIBRARY_BUILD 155 156 // Implementation 157 // 158 // Almost same as ATRACE_NAME, but enforcing explicit distinction between 159 // phase-per-scope and switching phases. 160 // 161 // Basic trace, one per scope allowed to enforce disjointness 162 #define NNTRACE_NAME_1(name) ::android::ScopedTrace ___tracer_1(ATRACE_TAG, name) 163 // Switching trace, more than one per scope allowed, translated by 164 // systrace_parser.py. This is mainly useful for tracing multiple phases through 165 // one function / scope. 166 #define NNTRACE_NAME_SWITCH(name) \ 167 ::android::ScopedTrace PASTE(___tracer, __LINE__)(ATRACE_TAG, name); \ 168 (void)___tracer_1 // ensure switch is only used after a basic trace 169 170 #else 171 172 #define NNTRACE_NAME_1(name) // empty 173 #define NNTRACE_NAME_SWITCH(name) // empty 174 175 #endif // NN_COMPATIBILITY_LIBRARY_BUILD 176 177 // Disallow use of raw ATRACE macros 178 #undef ATRACE_NAME 179 #undef ATRACE_CALL 180 181 #endif // ANDROID_PACKAGES_MODULES_NEURALNETWORKS_COMMON_TYPES_TRACING_H 182