1 /* Copyright 2017 The TensorFlow Authors All Rights Reserved.
2 
3 Licensed under the Apache License, Version 2.0 (the "License");
4 you may not use this file except in compliance with the License.
5 You may obtain a copy of the License at
6 
7     http://www.apache.org/licenses/LICENSE-2.0
8 
9 Unless required by applicable law or agreed to in writing, software
10 distributed under the License is distributed on an "AS IS" BASIS,
11 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 See the License for the specific language governing permissions and
13 limitations under the License.
14 ==============================================================================*/
15 
16 #include "tensorflow/core/profiler/rpc/client/dump_tpu_profile.h"
17 
18 #include <cstdio>
19 #include <ctime>
20 #include <vector>
21 
22 #include "tensorflow/core/lib/core/errors.h"
23 #include "tensorflow/core/lib/io/compression.h"
24 #include "tensorflow/core/lib/io/path.h"
25 #include "tensorflow/core/lib/strings/str_util.h"
26 #include "tensorflow/core/lib/strings/strcat.h"
27 #include "tensorflow/core/platform/env.h"
28 #include "tensorflow/core/platform/protobuf.h"
29 // Windows.h #defines ERROR, but it is also used in
30 // tensorflow/core/util/event.proto
31 #undef ERROR
32 #include "tensorflow/core/profiler/op_profile.pb.h"
33 #include "tensorflow/core/profiler/rpc/client/trace_events_to_json.h"
34 #include "tensorflow/core/profiler/trace_events.pb.h"
35 #include "tensorflow/core/util/events_writer.h"
36 
37 namespace tensorflow {
38 
39 namespace profiler {
40 namespace client {
41 namespace {
42 
43 using ::tensorflow::io::JoinPath;
44 using ::tensorflow::protobuf::util::JsonOptions;
45 using ::tensorflow::protobuf::util::MessageToJsonString;
46 using ::tensorflow::str_util::EndsWith;
47 using ::tensorflow::strings::StrCat;
48 
49 constexpr char kGraphRunPrefix[] = "tpu_profiler.hlo_graph.";
50 constexpr char kJsonOpProfileFileName[] = "op_profile.json";
51 constexpr char kJsonTraceFileName[] = "trace.json.gz";
52 constexpr char kProfilePluginDirectory[] = "plugins/profile/";
53 constexpr char kProtoTraceFileName[] = "trace";
54 
55 constexpr char kFlatProfilerFileName[] = "flat_profiler.pb";
56 constexpr char kTfStatsHelperSuffix[] = "tf_stats_helper_result";
57 
WriteGzippedDataToFile(const string & filename,const string & data)58 Status WriteGzippedDataToFile(const string& filename, const string& data) {
59   std::unique_ptr<WritableFile> file;
60   TF_RETURN_IF_ERROR(Env::Default()->NewWritableFile(filename, &file));
61   io::ZlibCompressionOptions options = io::ZlibCompressionOptions::GZIP();
62   io::ZlibOutputBuffer buffer(file.get(), options.input_buffer_size,
63                               options.output_buffer_size, options);
64   TF_RETURN_IF_ERROR(buffer.Init());
65   TF_RETURN_IF_ERROR(buffer.Append(data));
66   TF_RETURN_IF_ERROR(buffer.Close());
67   TF_RETURN_IF_ERROR(file->Close());
68   return Status::OK();
69 }
70 
DumpTraceToLogDirectory(StringPiece run_dir,const string & host_prefix,const string & encoded_trace,std::ostream * os)71 Status DumpTraceToLogDirectory(StringPiece run_dir, const string& host_prefix,
72                                const string& encoded_trace, std::ostream* os) {
73   string proto_path =
74       JoinPath(run_dir, StrCat(host_prefix, kProtoTraceFileName));
75   TF_RETURN_IF_ERROR(
76       WriteStringToFile(Env::Default(), proto_path, encoded_trace));
77   LOG(INFO) << "Dumped raw-proto trace data to " << proto_path;
78 
79   string json_path = JoinPath(run_dir, StrCat(host_prefix, kJsonTraceFileName));
80   Trace trace;
81   trace.ParseFromString(encoded_trace);
82   if (os) {
83     *os << "Trace contains " << trace.trace_events_size() << " events."
84         << std::endl;
85   }
86   TF_RETURN_IF_ERROR(
87       WriteGzippedDataToFile(json_path, TraceEventsToJson(trace)));
88   if (os) {
89     *os << "Dumped JSON trace data to " << json_path << std::endl;
90   }
91   return Status::OK();
92 }
93 
DumpOpProfileToLogDirectory(StringPiece run_dir,const string & host_prefix,const op_profile::Profile & profile,std::ostream * os)94 Status DumpOpProfileToLogDirectory(StringPiece run_dir,
95                                    const string& host_prefix,
96                                    const op_profile::Profile& profile,
97                                    std::ostream* os) {
98   string path = JoinPath(run_dir, StrCat(host_prefix, kJsonOpProfileFileName));
99   string json;
100   JsonOptions options;
101   options.always_print_primitive_fields = true;
102   auto status = MessageToJsonString(profile, &json, options);
103   if (!status.ok()) {
104     return errors::Internal(
105         "Failed to convert op profile to json. Skipping... ",
106         string(status.error_message()));
107   }
108   TF_RETURN_IF_ERROR(WriteStringToFile(Env::Default(), path, json));
109   if (os) {
110     *os << "Dumped json op profile data to " << path << std::endl;
111   }
112   return Status::OK();
113 }
114 
DumpToolDataToLogDirectory(StringPiece run_dir,const string & host_prefix,const ProfileToolData & tool,std::ostream * os)115 Status DumpToolDataToLogDirectory(StringPiece run_dir,
116                                   const string& host_prefix,
117                                   const ProfileToolData& tool,
118                                   std::ostream* os) {
119   // Don't save the intermediate results for combining the per host tool data.
120   if (EndsWith(tool.name(), kFlatProfilerFileName) ||
121       EndsWith(tool.name(), kTfStatsHelperSuffix))
122     return Status::OK();
123   string path = JoinPath(run_dir, StrCat(host_prefix, tool.name()));
124   TF_RETURN_IF_ERROR(WriteStringToFile(Env::Default(), path, tool.data()));
125   if (os) {
126     *os << "Dumped tool data for " << tool.name() << " to " << path
127         << std::endl;
128   }
129   return Status::OK();
130 }
131 
132 }  // namespace
133 
WriteTensorboardTPUProfile(const string & logdir,const string & run,const string & host,const ProfileResponse & response,std::ostream * os)134 Status WriteTensorboardTPUProfile(const string& logdir, const string& run,
135                                   const string& host,
136                                   const ProfileResponse& response,
137                                   std::ostream* os) {
138   // Dumps profile data to <logdir>/plugins/profile/<run>/.
139   string host_prefix = host.empty() ? "" : StrCat(host, ".");
140   string profile_run_dir = JoinPath(logdir, kProfilePluginDirectory, run);
141   *os << "Creating directory: " << profile_run_dir;
142   TF_RETURN_IF_ERROR(Env::Default()->RecursivelyCreateDir(profile_run_dir));
143 
144   // Ignore computation_graph for now.
145   if (!response.encoded_trace().empty()) {
146     LOG(INFO) << "Converting trace events to TraceViewer JSON.";
147     TF_RETURN_IF_ERROR(DumpTraceToLogDirectory(profile_run_dir, host_prefix,
148                                                response.encoded_trace(), os));
149   }
150   if (response.has_op_profile() && (response.op_profile().has_by_program() ||
151                                     response.op_profile().has_by_category())) {
152     TF_RETURN_IF_ERROR(DumpOpProfileToLogDirectory(profile_run_dir, host_prefix,
153                                                    response.op_profile(), os));
154   }
155   for (const auto& tool_data : response.tool_data()) {
156     TF_RETURN_IF_ERROR(DumpToolDataToLogDirectory(profile_run_dir, host_prefix,
157                                                   tool_data, os));
158   }
159 
160   return Status::OK();
161 }
162 
163 }  // namespace client
164 }  // namespace profiler
165 }  // namespace tensorflow
166