1 /* Copyright 2017 The TensorFlow Authors. All Rights Reserved. 2 3 Licensed under the Apache License, Version 2.0 (the "License"); 4 you may not use this file except in compliance with the License. 5 You may obtain a copy of the License at 6 7 http://www.apache.org/licenses/LICENSE-2.0 8 9 Unless required by applicable law or agreed to in writing, software 10 distributed under the License is distributed on an "AS IS" BASIS, 11 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 See the License for the specific language governing permissions and 13 limitations under the License. 14 ==============================================================================*/ 15 16 #ifndef TENSORFLOW_PYTHON_GRAPPLER_COST_ANALYZER_H_ 17 #define TENSORFLOW_PYTHON_GRAPPLER_COST_ANALYZER_H_ 18 19 #include <iostream> 20 #include "tensorflow/core/framework/cost_graph.pb.h" 21 #include "tensorflow/core/framework/graph.pb.h" 22 #include "tensorflow/core/framework/tensor_shape.pb.h" 23 #include "tensorflow/core/grappler/clusters/cluster.h" 24 #include "tensorflow/core/grappler/costs/analytical_cost_estimator.h" 25 #include "tensorflow/core/grappler/costs/cost_estimator.h" 26 #include "tensorflow/core/grappler/costs/measuring_cost_estimator.h" 27 #include "tensorflow/core/grappler/costs/op_performance_data.pb.h" 28 29 namespace tensorflow { 30 class GraphDef; 31 class CostGraphDef; 32 33 namespace grappler { 34 struct GrapplerItem; 35 36 // Aggregated perf summary for ops of the same type in a graph. 37 struct OpPerfSummary { 38 string name; 39 int64 count; 40 int64 time; 41 int64 compute_time; 42 int64 memory_time; 43 // Upper and lower bound for estimated time. 44 int64 time_upper; 45 int64 time_lower; 46 }; 47 48 // Generate op-level performance insights on compute/memory 49 // efficiency, as well as graph-level aggregated performance statistics. 50 class CostAnalyzer { 51 public: 52 explicit CostAnalyzer(const GrapplerItem& item, Cluster* cluster, 53 const string& suffix); 54 Status GenerateReport(std::ostream& os, bool per_node_report, bool verbose); 55 56 private: 57 void PredictCosts(CostEstimator* cost_estimator, CostGraphDef* cost_graph, 58 int64* total_time); 59 void GatherCosts(); 60 void PreprocessCosts(); 61 void AnalyzeCosts(); 62 void SortOpsByTime(std::map<string, OpPerfSummary> ops); 63 void PrintAnalysis(std::ostream& os, bool per_node_report, 64 bool verbose) const; 65 66 const GrapplerItem* item_; 67 MeasuringCostEstimator measure_estimator_; 68 AnalyticalCostEstimator analytical_estimator_; 69 OpPerformanceList op_perf_; 70 OpPerformanceList op_perf_analytical_; 71 int64 total_time_measured_; 72 int64 total_time_analytical_; 73 std::vector<OpPerfSummary> ops_; 74 int64 total_time_measured_serialized_; 75 int64 total_time_analytical_upper_; 76 int64 total_time_analytical_lower_; 77 string suffix_; 78 }; 79 80 } // end namespace grappler 81 } // end namespace tensorflow 82 83 #endif // TENSORFLOW_PYTHON_GRAPPLER_COST_ANALYZER_H_ 84