1 /*
2  * Copyright (C) 2020 The Android Open Source Project
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License");
5  * you may not use this file except in compliance with the License.
6  * You may obtain a copy of the License at
7  *
8  *      http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS,
12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13  * See the License for the specific language governing permissions and
14  * limitations under the License.
15  */
16 
17 #include "src/trace_processor/rpc/query_result_serializer.h"
18 
19 #include <vector>
20 
21 #include "perfetto/protozero/packed_repeated_fields.h"
22 #include "perfetto/protozero/proto_utils.h"
23 #include "perfetto/protozero/scattered_heap_buffer.h"
24 #include "src/trace_processor/iterator_impl.h"
25 
26 #include "protos/perfetto/trace_processor/trace_processor.pbzero.h"
27 
28 namespace perfetto {
29 namespace trace_processor {
30 
31 namespace {
32 
33 namespace pu = ::protozero::proto_utils;
34 using BatchProto = protos::pbzero::QueryResult::CellsBatch;
35 using ResultProto = protos::pbzero::QueryResult;
36 
37 // The reserved field in trace_processor.proto.
38 static constexpr uint32_t kPaddingFieldId = 7;
39 
MakeLenDelimTag(uint32_t field_num)40 uint8_t MakeLenDelimTag(uint32_t field_num) {
41   uint32_t tag = pu::MakeTagLengthDelimited(field_num);
42   PERFETTO_DCHECK(tag <= 127);  // Must fit in one byte.
43   return static_cast<uint8_t>(tag);
44 }
45 
46 }  // namespace
47 
QueryResultSerializer(Iterator iter)48 QueryResultSerializer::QueryResultSerializer(Iterator iter)
49     : iter_(iter.take_impl()), num_cols_(iter_->ColumnCount()) {}
50 
51 QueryResultSerializer::~QueryResultSerializer() = default;
52 
Serialize(std::vector<uint8_t> * buf)53 bool QueryResultSerializer::Serialize(std::vector<uint8_t>* buf) {
54   const size_t slice = batch_split_threshold_ + 4096;
55   protozero::HeapBuffered<protos::pbzero::QueryResult> result(slice, slice);
56   bool has_more = Serialize(result.get());
57   auto arr = result.SerializeAsArray();
58   buf->insert(buf->end(), arr.begin(), arr.end());
59   return has_more;
60 }
61 
Serialize(protos::pbzero::QueryResult * res)62 bool QueryResultSerializer::Serialize(protos::pbzero::QueryResult* res) {
63   PERFETTO_CHECK(!eof_reached_);
64 
65   if (!did_write_column_names_) {
66     SerializeColumnNames(res);
67     did_write_column_names_ = true;
68   }
69 
70   // In case of an error we still want to go through SerializeBatch(). That will
71   // write an empty batch with the EOF marker. Errors can happen also in the
72   // middle of a query, not just before starting it.
73 
74   SerializeBatch(res);
75   MaybeSerializeError(res);
76   return !eof_reached_;
77 }
78 
SerializeBatch(protos::pbzero::QueryResult * res)79 void QueryResultSerializer::SerializeBatch(protos::pbzero::QueryResult* res) {
80   // The buffer is filled in this way:
81   // - Append all the strings as we iterate through the results. The rationale
82   //   is that strings are typically the largest part of the result and we want
83   //   to avoid copying these.
84   // - While iterating, buffer all other types of cells. They will be appended
85   //   at the end of the batch, after the string payload is known.
86 
87   // Note: this function uses uint32_t instead of size_t because Wasm doesn't
88   // have yet native 64-bit integers and this is perf-sensitive.
89 
90   const auto& writer = *res->stream_writer();
91   auto* batch = res->add_batch();
92 
93   // Start the |string_cells|.
94   auto* strings = batch->BeginNestedMessage<protozero::Message>(
95       BatchProto::kStringCellsFieldNumber);
96 
97   // This keeps track of the overall size of the batch. It is used to decide if
98   // we need to prematurely end the batch, even if the batch_split_threshold_ is
99   // not reached. This is to guard against the degenerate case of appending a
100   // lot of very large strings and ending up with an enormous batch.
101   uint32_t approx_batch_size = 16;
102 
103   std::vector<uint8_t> cell_types(cells_per_batch_);
104 
105   // Varints and doubles are written on stack-based storage and appended later.
106   protozero::PackedVarInt varints;
107   protozero::PackedFixedSizeInt<double> doubles;
108 
109   // We write blobs on a temporary heap buffer and append it at the end. Blobs
110   // are extremely rare, trying to avoid copies is not worth the complexity.
111   std::vector<uint8_t> blobs;
112 
113   uint32_t cell_idx = 0;
114   bool batch_full = false;
115 
116   for (;; ++cell_idx, ++col_) {
117     // This branch is hit before starting each row. Note that iter_->Next() must
118     // be called before iterating on a row. col_ is initialized at MAX_INT in
119     // the constructor.
120     if (col_ >= num_cols_) {
121       col_ = 0;
122       // If num_cols_ == 0 and the query didn't return any result (e.g. CREATE
123       // TABLE) we should exit at this point. We still need to advance the
124       // iterator via Next() otherwise the statement will have no effect.
125       if (!iter_->Next())
126         break;  // EOF or error.
127 
128       PERFETTO_DCHECK(num_cols_ > 0);
129       // We need to guarantee that a batch contains whole rows. Before moving to
130       // the next row, make sure that: (i) there is space for all the columns;
131       // (ii) the batch didn't grow too much.
132       if (cell_idx + num_cols_ > cells_per_batch_ ||
133           approx_batch_size > batch_split_threshold_) {
134         batch_full = true;
135         break;
136       }
137     }
138 
139     auto value = iter_->Get(col_);
140     uint8_t cell_type = BatchProto::CELL_INVALID;
141     switch (value.type) {
142       case SqlValue::Type::kNull: {
143         cell_type = BatchProto::CELL_NULL;
144         break;
145       }
146       case SqlValue::Type::kLong: {
147         cell_type = BatchProto::CELL_VARINT;
148         varints.Append(value.long_value);
149         approx_batch_size += 4;  // Just a guess, doesn't need to be accurate.
150         break;
151       }
152       case SqlValue::Type::kDouble: {
153         cell_type = BatchProto::CELL_FLOAT64;
154         approx_batch_size += sizeof(double);
155         doubles.Append(value.double_value);
156         break;
157       }
158       case SqlValue::Type::kString: {
159         // Append the string to the one |string_cells| proto field, just use
160         // \0 to separate each string. We are deliberately NOT emitting one
161         // proto repeated field for each string. Doing so significantly slows
162         // down parsing on the JS side (go/postmessage-benchmark).
163         cell_type = BatchProto::CELL_STRING;
164         uint32_t len_with_nul =
165             static_cast<uint32_t>(strlen(value.string_value)) + 1;
166         const char* str_begin = value.string_value;
167         strings->AppendRawProtoBytes(str_begin, len_with_nul);
168         approx_batch_size += len_with_nul + 4;  // 4 is a guess on the preamble.
169         break;
170       }
171       case SqlValue::Type::kBytes: {
172         // Each blob is stored as its own repeated proto field, unlike strings.
173         // Blobs don't incur in text-decoding overhead (and are also rare).
174         cell_type = BatchProto::CELL_BLOB;
175         auto* src = static_cast<const uint8_t*>(value.bytes_value);
176         uint32_t len = static_cast<uint32_t>(value.bytes_count);
177         uint8_t preamble[16];
178         uint8_t* preamble_end = &preamble[0];
179         *(preamble_end++) = MakeLenDelimTag(BatchProto::kBlobCellsFieldNumber);
180         preamble_end = pu::WriteVarInt(len, preamble_end);
181         blobs.insert(blobs.end(), preamble, preamble_end);
182         blobs.insert(blobs.end(), src, src + len);
183         approx_batch_size += len + 4;  // 4 is a guess on the preamble size.
184         break;
185       }
186     }
187 
188     PERFETTO_DCHECK(cell_type != BatchProto::CELL_INVALID);
189     cell_types[cell_idx] = cell_type;
190   }  // for (cell)
191 
192   // Backfill the string size.
193   strings->Finalize();
194   strings = nullptr;
195 
196   // Write the cells headers (1 byte per cell).
197   batch->AppendBytes(BatchProto::kCellsFieldNumber, cell_types.data(),
198                      cell_idx);
199 
200   // Append the |varint_cells|, copying over the packed varint buffer.
201   if (varints.size())
202     batch->set_varint_cells(varints);
203 
204   // Append the |float64_cells|, copying over the packed fixed64 buffer. This is
205   // appended at a 64-bit aligned offset, so that JS can access these by overlay
206   // a TypedArray, without extra copies.
207   const uint32_t doubles_size = static_cast<uint32_t>(doubles.size());
208   if (doubles_size > 0) {
209     uint8_t preamble[16];
210     uint8_t* preamble_end = &preamble[0];
211     *(preamble_end++) = MakeLenDelimTag(BatchProto::kFloat64CellsFieldNumber);
212     preamble_end = pu::WriteVarInt(doubles_size, preamble_end);
213     uint32_t preamble_size = static_cast<uint32_t>(preamble_end - &preamble[0]);
214 
215     // The byte after the preamble must start at a 64bit-aligned offset.
216     // The padding needs to be > 1 Byte because of proto encoding.
217     const uint32_t off =
218         static_cast<uint32_t>(writer.written() + preamble_size);
219     const uint32_t aligned_off = (off + 7) & ~7u;
220     uint32_t padding = aligned_off - off;
221     padding = padding == 1 ? 9 : padding;
222     if (padding > 0) {
223       uint8_t pad_buf[10];
224       uint8_t* pad = pad_buf;
225       *(pad++) = pu::MakeTagVarInt(kPaddingFieldId);
226       for (uint32_t i = 0; i < padding - 2; i++)
227         *(pad++) = 0x80;
228       *(pad++) = 0;
229       batch->AppendRawProtoBytes(pad_buf, static_cast<size_t>(pad - pad_buf));
230     }
231     batch->AppendRawProtoBytes(preamble, preamble_size);
232     PERFETTO_CHECK(writer.written() % 8 == 0);
233     batch->AppendRawProtoBytes(doubles.data(), doubles_size);
234   }  // if (doubles_size > 0)
235 
236   // Append the blobs.
237   batch->AppendRawProtoBytes(blobs.data(), blobs.size());
238 
239   // If this is the last batch, write the EOF field.
240   if (!batch_full) {
241     eof_reached_ = true;
242     batch->set_is_last_batch(true);
243   }
244 
245   // Finally backfill the size of the whole |batch| sub-message.
246   batch->Finalize();
247 }
248 
MaybeSerializeError(protos::pbzero::QueryResult * res)249 void QueryResultSerializer::MaybeSerializeError(
250     protos::pbzero::QueryResult* res) {
251   if (iter_->Status().ok())
252     return;
253   std::string err = iter_->Status().message();
254   // Make sure the |error| field is always non-zero if the query failed, so
255   // the client can tell some error happened.
256   if (err.empty())
257     err = "Unknown error";
258   res->set_error(err);
259 }
260 
SerializeColumnNames(protos::pbzero::QueryResult * res)261 void QueryResultSerializer::SerializeColumnNames(
262     protos::pbzero::QueryResult* res) {
263   PERFETTO_DCHECK(!did_write_column_names_);
264   for (uint32_t c = 0; c < num_cols_; c++)
265     res->add_column_names(iter_->GetColumnName(c));
266 }
267 
268 }  // namespace trace_processor
269 }  // namespace perfetto
270