1 // Protocol Buffers - Google's data interchange format
2 // Copyright 2008 Google Inc. All rights reserved.
3 // https://developers.google.com/protocol-buffers/
4 //
5 // Redistribution and use in source and binary forms, with or without
6 // modification, are permitted provided that the following conditions are
7 // met:
8 //
9 // * Redistributions of source code must retain the above copyright
10 // notice, this list of conditions and the following disclaimer.
11 // * Redistributions in binary form must reproduce the above
12 // copyright notice, this list of conditions and the following disclaimer
13 // in the documentation and/or other materials provided with the
14 // distribution.
15 // * Neither the name of Google Inc. nor the names of its
16 // contributors may be used to endorse or promote products derived from
17 // this software without specific prior written permission.
18 //
19 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
20 // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
21 // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
22 // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
23 // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
24 // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
25 // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
26 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
27 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
28 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
29 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30
31 // Author: jschorr@google.com (Joseph Schorr)
32 // Based on original Protocol Buffers design by
33 // Sanjay Ghemawat, Jeff Dean, and others.
34
35 #include <algorithm>
36 #include <float.h>
37 #include <math.h>
38 #include <stdio.h>
39 #include <stack>
40 #include <limits>
41 #include <vector>
42
43 #include <google/protobuf/text_format.h>
44
45 #include <google/protobuf/descriptor.h>
46 #include <google/protobuf/dynamic_message.h>
47 #include <google/protobuf/repeated_field.h>
48 #include <google/protobuf/wire_format_lite.h>
49 #include <google/protobuf/io/strtod.h>
50 #include <google/protobuf/io/coded_stream.h>
51 #include <google/protobuf/io/zero_copy_stream.h>
52 #include <google/protobuf/io/zero_copy_stream_impl.h>
53 #include <google/protobuf/unknown_field_set.h>
54 #include <google/protobuf/descriptor.pb.h>
55 #include <google/protobuf/io/tokenizer.h>
56 #include <google/protobuf/any.h>
57 #include <google/protobuf/stubs/stringprintf.h>
58 #include <google/protobuf/stubs/strutil.h>
59 #include <google/protobuf/stubs/map_util.h>
60 #include <google/protobuf/stubs/stl_util.h>
61
62 namespace google {
63 namespace protobuf {
64
65 namespace {
66
IsHexNumber(const string & str)67 inline bool IsHexNumber(const string& str) {
68 return (str.length() >= 2 && str[0] == '0' &&
69 (str[1] == 'x' || str[1] == 'X'));
70 }
71
IsOctNumber(const string & str)72 inline bool IsOctNumber(const string& str) {
73 return (str.length() >= 2 && str[0] == '0' &&
74 (str[1] >= '0' && str[1] < '8'));
75 }
76
GetAnyFieldDescriptors(const Message & message,const FieldDescriptor ** type_url_field,const FieldDescriptor ** value_field)77 inline bool GetAnyFieldDescriptors(const Message& message,
78 const FieldDescriptor** type_url_field,
79 const FieldDescriptor** value_field) {
80 const Descriptor* descriptor = message.GetDescriptor();
81 *type_url_field = descriptor->FindFieldByNumber(1);
82 *value_field = descriptor->FindFieldByNumber(2);
83 return (*type_url_field != NULL &&
84 (*type_url_field)->type() == FieldDescriptor::TYPE_STRING &&
85 *value_field != NULL &&
86 (*value_field)->type() == FieldDescriptor::TYPE_BYTES);
87 }
88
89 } // namespace
90
DebugString() const91 string Message::DebugString() const {
92 string debug_string;
93
94 TextFormat::Printer printer;
95 printer.SetExpandAny(true);
96
97 printer.PrintToString(*this, &debug_string);
98
99 return debug_string;
100 }
101
ShortDebugString() const102 string Message::ShortDebugString() const {
103 string debug_string;
104
105 TextFormat::Printer printer;
106 printer.SetSingleLineMode(true);
107 printer.SetExpandAny(true);
108
109 printer.PrintToString(*this, &debug_string);
110 // Single line mode currently might have an extra space at the end.
111 if (debug_string.size() > 0 &&
112 debug_string[debug_string.size() - 1] == ' ') {
113 debug_string.resize(debug_string.size() - 1);
114 }
115
116 return debug_string;
117 }
118
Utf8DebugString() const119 string Message::Utf8DebugString() const {
120 string debug_string;
121
122 TextFormat::Printer printer;
123 printer.SetUseUtf8StringEscaping(true);
124 printer.SetExpandAny(true);
125
126 printer.PrintToString(*this, &debug_string);
127
128 return debug_string;
129 }
130
PrintDebugString() const131 void Message::PrintDebugString() const {
132 printf("%s", DebugString().c_str());
133 }
134
135
136 // ===========================================================================
137 // Implementation of the parse information tree class.
ParseInfoTree()138 TextFormat::ParseInfoTree::ParseInfoTree() { }
139
~ParseInfoTree()140 TextFormat::ParseInfoTree::~ParseInfoTree() {
141 // Remove any nested information trees, as they are owned by this tree.
142 for (NestedMap::iterator it = nested_.begin(); it != nested_.end(); ++it) {
143 STLDeleteElements(&(it->second));
144 }
145 }
146
RecordLocation(const FieldDescriptor * field,TextFormat::ParseLocation location)147 void TextFormat::ParseInfoTree::RecordLocation(
148 const FieldDescriptor* field,
149 TextFormat::ParseLocation location) {
150 locations_[field].push_back(location);
151 }
152
CreateNested(const FieldDescriptor * field)153 TextFormat::ParseInfoTree* TextFormat::ParseInfoTree::CreateNested(
154 const FieldDescriptor* field) {
155 // Owned by us in the map.
156 TextFormat::ParseInfoTree* instance = new TextFormat::ParseInfoTree();
157 vector<TextFormat::ParseInfoTree*>* trees = &nested_[field];
158 GOOGLE_CHECK(trees);
159 trees->push_back(instance);
160 return instance;
161 }
162
CheckFieldIndex(const FieldDescriptor * field,int index)163 void CheckFieldIndex(const FieldDescriptor* field, int index) {
164 if (field == NULL) { return; }
165
166 if (field->is_repeated() && index == -1) {
167 GOOGLE_LOG(DFATAL) << "Index must be in range of repeated field values. "
168 << "Field: " << field->name();
169 } else if (!field->is_repeated() && index != -1) {
170 GOOGLE_LOG(DFATAL) << "Index must be -1 for singular fields."
171 << "Field: " << field->name();
172 }
173 }
174
GetLocation(const FieldDescriptor * field,int index) const175 TextFormat::ParseLocation TextFormat::ParseInfoTree::GetLocation(
176 const FieldDescriptor* field, int index) const {
177 CheckFieldIndex(field, index);
178 if (index == -1) { index = 0; }
179
180 const vector<TextFormat::ParseLocation>* locations =
181 FindOrNull(locations_, field);
182 if (locations == NULL || index >= locations->size()) {
183 return TextFormat::ParseLocation();
184 }
185
186 return (*locations)[index];
187 }
188
GetTreeForNested(const FieldDescriptor * field,int index) const189 TextFormat::ParseInfoTree* TextFormat::ParseInfoTree::GetTreeForNested(
190 const FieldDescriptor* field, int index) const {
191 CheckFieldIndex(field, index);
192 if (index == -1) { index = 0; }
193
194 const vector<TextFormat::ParseInfoTree*>* trees = FindOrNull(nested_, field);
195 if (trees == NULL || index >= trees->size()) {
196 return NULL;
197 }
198
199 return (*trees)[index];
200 }
201
202
203 // ===========================================================================
204 // Internal class for parsing an ASCII representation of a Protocol Message.
205 // This class makes use of the Protocol Message compiler's tokenizer found
206 // in //google/protobuf/io/tokenizer.h. Note that class's Parse
207 // method is *not* thread-safe and should only be used in a single thread at
208 // a time.
209
210 // Makes code slightly more readable. The meaning of "DO(foo)" is
211 // "Execute foo and fail if it fails.", where failure is indicated by
212 // returning false. Borrowed from parser.cc (Thanks Kenton!).
213 #define DO(STATEMENT) if (STATEMENT) {} else return false
214
215 class TextFormat::Parser::ParserImpl {
216 public:
217
218 // Determines if repeated values for non-repeated fields and
219 // oneofs are permitted, e.g., the string "foo: 1 foo: 2" for a
220 // required/optional field named "foo", or "baz: 1 qux: 2"
221 // where "baz" and "qux" are members of the same oneof.
222 enum SingularOverwritePolicy {
223 ALLOW_SINGULAR_OVERWRITES = 0, // the last value is retained
224 FORBID_SINGULAR_OVERWRITES = 1, // an error is issued
225 };
226
ParserImpl(const Descriptor * root_message_type,io::ZeroCopyInputStream * input_stream,io::ErrorCollector * error_collector,TextFormat::Finder * finder,ParseInfoTree * parse_info_tree,SingularOverwritePolicy singular_overwrite_policy,bool allow_case_insensitive_field,bool allow_unknown_field,bool allow_unknown_enum,bool allow_field_number,bool allow_relaxed_whitespace,bool allow_partial)227 ParserImpl(const Descriptor* root_message_type,
228 io::ZeroCopyInputStream* input_stream,
229 io::ErrorCollector* error_collector,
230 TextFormat::Finder* finder,
231 ParseInfoTree* parse_info_tree,
232 SingularOverwritePolicy singular_overwrite_policy,
233 bool allow_case_insensitive_field,
234 bool allow_unknown_field,
235 bool allow_unknown_enum,
236 bool allow_field_number,
237 bool allow_relaxed_whitespace,
238 bool allow_partial)
239 : error_collector_(error_collector),
240 finder_(finder),
241 parse_info_tree_(parse_info_tree),
242 tokenizer_error_collector_(this),
243 tokenizer_(input_stream, &tokenizer_error_collector_),
244 root_message_type_(root_message_type),
245 singular_overwrite_policy_(singular_overwrite_policy),
246 allow_case_insensitive_field_(allow_case_insensitive_field),
247 allow_unknown_field_(allow_unknown_field),
248 allow_unknown_enum_(allow_unknown_enum),
249 allow_field_number_(allow_field_number),
250 allow_partial_(allow_partial),
251 had_errors_(false) {
252 // For backwards-compatibility with proto1, we need to allow the 'f' suffix
253 // for floats.
254 tokenizer_.set_allow_f_after_float(true);
255
256 // '#' starts a comment.
257 tokenizer_.set_comment_style(io::Tokenizer::SH_COMMENT_STYLE);
258
259 if (allow_relaxed_whitespace) {
260 tokenizer_.set_require_space_after_number(false);
261 tokenizer_.set_allow_multiline_strings(true);
262 }
263
264 // Consume the starting token.
265 tokenizer_.Next();
266 }
~ParserImpl()267 ~ParserImpl() { }
268
269 // Parses the ASCII representation specified in input and saves the
270 // information into the output pointer (a Message). Returns
271 // false if an error occurs (an error will also be logged to
272 // GOOGLE_LOG(ERROR)).
Parse(Message * output)273 bool Parse(Message* output) {
274 // Consume fields until we cannot do so anymore.
275 while (true) {
276 if (LookingAtType(io::Tokenizer::TYPE_END)) {
277 return !had_errors_;
278 }
279
280 DO(ConsumeField(output));
281 }
282 }
283
ParseField(const FieldDescriptor * field,Message * output)284 bool ParseField(const FieldDescriptor* field, Message* output) {
285 bool suc;
286 if (field->cpp_type() == FieldDescriptor::CPPTYPE_MESSAGE) {
287 suc = ConsumeFieldMessage(output, output->GetReflection(), field);
288 } else {
289 suc = ConsumeFieldValue(output, output->GetReflection(), field);
290 }
291 return suc && LookingAtType(io::Tokenizer::TYPE_END);
292 }
293
ReportError(int line,int col,const string & message)294 void ReportError(int line, int col, const string& message) {
295 had_errors_ = true;
296 if (error_collector_ == NULL) {
297 if (line >= 0) {
298 GOOGLE_LOG(ERROR) << "Error parsing text-format "
299 << root_message_type_->full_name()
300 << ": " << (line + 1) << ":"
301 << (col + 1) << ": " << message;
302 } else {
303 GOOGLE_LOG(ERROR) << "Error parsing text-format "
304 << root_message_type_->full_name()
305 << ": " << message;
306 }
307 } else {
308 error_collector_->AddError(line, col, message);
309 }
310 }
311
ReportWarning(int line,int col,const string & message)312 void ReportWarning(int line, int col, const string& message) {
313 if (error_collector_ == NULL) {
314 if (line >= 0) {
315 GOOGLE_LOG(WARNING) << "Warning parsing text-format "
316 << root_message_type_->full_name()
317 << ": " << (line + 1) << ":"
318 << (col + 1) << ": " << message;
319 } else {
320 GOOGLE_LOG(WARNING) << "Warning parsing text-format "
321 << root_message_type_->full_name()
322 << ": " << message;
323 }
324 } else {
325 error_collector_->AddWarning(line, col, message);
326 }
327 }
328
329 private:
330 GOOGLE_DISALLOW_EVIL_CONSTRUCTORS(ParserImpl);
331
332 // Reports an error with the given message with information indicating
333 // the position (as derived from the current token).
ReportError(const string & message)334 void ReportError(const string& message) {
335 ReportError(tokenizer_.current().line, tokenizer_.current().column,
336 message);
337 }
338
339 // Reports a warning with the given message with information indicating
340 // the position (as derived from the current token).
ReportWarning(const string & message)341 void ReportWarning(const string& message) {
342 ReportWarning(tokenizer_.current().line, tokenizer_.current().column,
343 message);
344 }
345
346 // Consumes the specified message with the given starting delimiter.
347 // This method checks to see that the end delimiter at the conclusion of
348 // the consumption matches the starting delimiter passed in here.
ConsumeMessage(Message * message,const string delimiter)349 bool ConsumeMessage(Message* message, const string delimiter) {
350 while (!LookingAt(">") && !LookingAt("}")) {
351 DO(ConsumeField(message));
352 }
353
354 // Confirm that we have a valid ending delimiter.
355 DO(Consume(delimiter));
356 return true;
357 }
358
359 // Consume either "<" or "{".
ConsumeMessageDelimiter(string * delimiter)360 bool ConsumeMessageDelimiter(string* delimiter) {
361 if (TryConsume("<")) {
362 *delimiter = ">";
363 } else {
364 DO(Consume("{"));
365 *delimiter = "}";
366 }
367 return true;
368 }
369
370
371 // Consumes the current field (as returned by the tokenizer) on the
372 // passed in message.
ConsumeField(Message * message)373 bool ConsumeField(Message* message) {
374 const Reflection* reflection = message->GetReflection();
375 const Descriptor* descriptor = message->GetDescriptor();
376
377 string field_name;
378
379 const FieldDescriptor* field = NULL;
380 int start_line = tokenizer_.current().line;
381 int start_column = tokenizer_.current().column;
382
383 const FieldDescriptor* any_type_url_field;
384 const FieldDescriptor* any_value_field;
385 if (internal::GetAnyFieldDescriptors(*message, &any_type_url_field,
386 &any_value_field) &&
387 TryConsume("[")) {
388 string full_type_name, prefix;
389 DO(ConsumeAnyTypeUrl(&full_type_name, &prefix));
390 DO(Consume("]"));
391 TryConsume(":"); // ':' is optional between message labels and values.
392 string serialized_value;
393 DO(ConsumeAnyValue(full_type_name,
394 message->GetDescriptor()->file()->pool(),
395 &serialized_value));
396 reflection->SetString(
397 message, any_type_url_field,
398 string(prefix + full_type_name));
399 reflection->SetString(message, any_value_field, serialized_value);
400 return true;
401 }
402 if (TryConsume("[")) {
403 // Extension.
404 DO(ConsumeFullTypeName(&field_name));
405 DO(Consume("]"));
406
407 field = (finder_ != NULL
408 ? finder_->FindExtension(message, field_name)
409 : reflection->FindKnownExtensionByName(field_name));
410
411 if (field == NULL) {
412 if (!allow_unknown_field_) {
413 ReportError("Extension \"" + field_name + "\" is not defined or "
414 "is not an extension of \"" +
415 descriptor->full_name() + "\".");
416 return false;
417 } else {
418 ReportWarning("Extension \"" + field_name + "\" is not defined or "
419 "is not an extension of \"" +
420 descriptor->full_name() + "\".");
421 }
422 }
423 } else {
424 DO(ConsumeIdentifier(&field_name));
425
426 int32 field_number;
427 if (allow_field_number_ && safe_strto32(field_name, &field_number)) {
428 if (descriptor->IsExtensionNumber(field_number)) {
429 field = reflection->FindKnownExtensionByNumber(field_number);
430 } else {
431 field = descriptor->FindFieldByNumber(field_number);
432 }
433 } else {
434 field = descriptor->FindFieldByName(field_name);
435 // Group names are expected to be capitalized as they appear in the
436 // .proto file, which actually matches their type names, not their
437 // field names.
438 if (field == NULL) {
439 string lower_field_name = field_name;
440 LowerString(&lower_field_name);
441 field = descriptor->FindFieldByName(lower_field_name);
442 // If the case-insensitive match worked but the field is NOT a group,
443 if (field != NULL && field->type() != FieldDescriptor::TYPE_GROUP) {
444 field = NULL;
445 }
446 }
447 // Again, special-case group names as described above.
448 if (field != NULL && field->type() == FieldDescriptor::TYPE_GROUP
449 && field->message_type()->name() != field_name) {
450 field = NULL;
451 }
452
453 if (field == NULL && allow_case_insensitive_field_) {
454 string lower_field_name = field_name;
455 LowerString(&lower_field_name);
456 field = descriptor->FindFieldByLowercaseName(lower_field_name);
457 }
458 }
459
460 if (field == NULL) {
461 if (!allow_unknown_field_) {
462 ReportError("Message type \"" + descriptor->full_name() +
463 "\" has no field named \"" + field_name + "\".");
464 return false;
465 } else {
466 ReportWarning("Message type \"" + descriptor->full_name() +
467 "\" has no field named \"" + field_name + "\".");
468 }
469 }
470 }
471
472 // Skips unknown field.
473 if (field == NULL) {
474 GOOGLE_CHECK(allow_unknown_field_);
475 // Try to guess the type of this field.
476 // If this field is not a message, there should be a ":" between the
477 // field name and the field value and also the field value should not
478 // start with "{" or "<" which indicates the beginning of a message body.
479 // If there is no ":" or there is a "{" or "<" after ":", this field has
480 // to be a message or the input is ill-formed.
481 if (TryConsume(":") && !LookingAt("{") && !LookingAt("<")) {
482 return SkipFieldValue();
483 } else {
484 return SkipFieldMessage();
485 }
486 }
487
488 if (singular_overwrite_policy_ == FORBID_SINGULAR_OVERWRITES) {
489 // Fail if the field is not repeated and it has already been specified.
490 if (!field->is_repeated() && reflection->HasField(*message, field)) {
491 ReportError("Non-repeated field \"" + field_name +
492 "\" is specified multiple times.");
493 return false;
494 }
495 // Fail if the field is a member of a oneof and another member has already
496 // been specified.
497 const OneofDescriptor* oneof = field->containing_oneof();
498 if (oneof != NULL && reflection->HasOneof(*message, oneof)) {
499 const FieldDescriptor* other_field =
500 reflection->GetOneofFieldDescriptor(*message, oneof);
501 ReportError("Field \"" + field_name + "\" is specified along with "
502 "field \"" + other_field->name() + "\", another member "
503 "of oneof \"" + oneof->name() + "\".");
504 return false;
505 }
506 }
507
508 // Perform special handling for embedded message types.
509 if (field->cpp_type() == FieldDescriptor::CPPTYPE_MESSAGE) {
510 // ':' is optional here.
511 TryConsume(":");
512 } else {
513 // ':' is required here.
514 DO(Consume(":"));
515 }
516
517 if (field->is_repeated() && TryConsume("[")) {
518 // Short repeated format, e.g. "foo: [1, 2, 3]"
519 while (true) {
520 if (field->cpp_type() == FieldDescriptor::CPPTYPE_MESSAGE) {
521 // Perform special handling for embedded message types.
522 DO(ConsumeFieldMessage(message, reflection, field));
523 } else {
524 DO(ConsumeFieldValue(message, reflection, field));
525 }
526 if (TryConsume("]")) {
527 break;
528 }
529 DO(Consume(","));
530 }
531 } else if (field->cpp_type() == FieldDescriptor::CPPTYPE_MESSAGE) {
532 DO(ConsumeFieldMessage(message, reflection, field));
533 } else {
534 DO(ConsumeFieldValue(message, reflection, field));
535 }
536
537 // For historical reasons, fields may optionally be separated by commas or
538 // semicolons.
539 TryConsume(";") || TryConsume(",");
540
541 if (field->options().deprecated()) {
542 ReportWarning("text format contains deprecated field \""
543 + field_name + "\"");
544 }
545
546 // If a parse info tree exists, add the location for the parsed
547 // field.
548 if (parse_info_tree_ != NULL) {
549 RecordLocation(parse_info_tree_, field,
550 ParseLocation(start_line, start_column));
551 }
552
553 return true;
554 }
555
556 // Skips the next field including the field's name and value.
SkipField()557 bool SkipField() {
558 string field_name;
559 if (TryConsume("[")) {
560 // Extension name.
561 DO(ConsumeFullTypeName(&field_name));
562 DO(Consume("]"));
563 } else {
564 DO(ConsumeIdentifier(&field_name));
565 }
566
567 // Try to guess the type of this field.
568 // If this field is not a message, there should be a ":" between the
569 // field name and the field value and also the field value should not
570 // start with "{" or "<" which indicates the beginning of a message body.
571 // If there is no ":" or there is a "{" or "<" after ":", this field has
572 // to be a message or the input is ill-formed.
573 if (TryConsume(":") && !LookingAt("{") && !LookingAt("<")) {
574 DO(SkipFieldValue());
575 } else {
576 DO(SkipFieldMessage());
577 }
578 // For historical reasons, fields may optionally be separated by commas or
579 // semicolons.
580 TryConsume(";") || TryConsume(",");
581 return true;
582 }
583
ConsumeFieldMessage(Message * message,const Reflection * reflection,const FieldDescriptor * field)584 bool ConsumeFieldMessage(Message* message,
585 const Reflection* reflection,
586 const FieldDescriptor* field) {
587
588 // If the parse information tree is not NULL, create a nested one
589 // for the nested message.
590 ParseInfoTree* parent = parse_info_tree_;
591 if (parent != NULL) {
592 parse_info_tree_ = CreateNested(parent, field);
593 }
594
595 string delimiter;
596 DO(ConsumeMessageDelimiter(&delimiter));
597 if (field->is_repeated()) {
598 DO(ConsumeMessage(reflection->AddMessage(message, field), delimiter));
599 } else {
600 DO(ConsumeMessage(reflection->MutableMessage(message, field),
601 delimiter));
602 }
603
604 // Reset the parse information tree.
605 parse_info_tree_ = parent;
606 return true;
607 }
608
609 // Skips the whole body of a message including the beginning delimiter and
610 // the ending delimiter.
SkipFieldMessage()611 bool SkipFieldMessage() {
612 string delimiter;
613 DO(ConsumeMessageDelimiter(&delimiter));
614 while (!LookingAt(">") && !LookingAt("}")) {
615 DO(SkipField());
616 }
617 DO(Consume(delimiter));
618 return true;
619 }
620
ConsumeFieldValue(Message * message,const Reflection * reflection,const FieldDescriptor * field)621 bool ConsumeFieldValue(Message* message,
622 const Reflection* reflection,
623 const FieldDescriptor* field) {
624
625 // Define an easy to use macro for setting fields. This macro checks
626 // to see if the field is repeated (in which case we need to use the Add
627 // methods or not (in which case we need to use the Set methods).
628 #define SET_FIELD(CPPTYPE, VALUE) \
629 if (field->is_repeated()) { \
630 reflection->Add##CPPTYPE(message, field, VALUE); \
631 } else { \
632 reflection->Set##CPPTYPE(message, field, VALUE); \
633 } \
634
635 switch(field->cpp_type()) {
636 case FieldDescriptor::CPPTYPE_INT32: {
637 int64 value;
638 DO(ConsumeSignedInteger(&value, kint32max));
639 SET_FIELD(Int32, static_cast<int32>(value));
640 break;
641 }
642
643 case FieldDescriptor::CPPTYPE_UINT32: {
644 uint64 value;
645 DO(ConsumeUnsignedInteger(&value, kuint32max));
646 SET_FIELD(UInt32, static_cast<uint32>(value));
647 break;
648 }
649
650 case FieldDescriptor::CPPTYPE_INT64: {
651 int64 value;
652 DO(ConsumeSignedInteger(&value, kint64max));
653 SET_FIELD(Int64, value);
654 break;
655 }
656
657 case FieldDescriptor::CPPTYPE_UINT64: {
658 uint64 value;
659 DO(ConsumeUnsignedInteger(&value, kuint64max));
660 SET_FIELD(UInt64, value);
661 break;
662 }
663
664 case FieldDescriptor::CPPTYPE_FLOAT: {
665 double value;
666 DO(ConsumeDouble(&value));
667 SET_FIELD(Float, io::SafeDoubleToFloat(value));
668 break;
669 }
670
671 case FieldDescriptor::CPPTYPE_DOUBLE: {
672 double value;
673 DO(ConsumeDouble(&value));
674 SET_FIELD(Double, value);
675 break;
676 }
677
678 case FieldDescriptor::CPPTYPE_STRING: {
679 string value;
680 DO(ConsumeString(&value));
681 SET_FIELD(String, value);
682 break;
683 }
684
685 case FieldDescriptor::CPPTYPE_BOOL: {
686 if (LookingAtType(io::Tokenizer::TYPE_INTEGER)) {
687 uint64 value;
688 DO(ConsumeUnsignedInteger(&value, 1));
689 SET_FIELD(Bool, value);
690 } else {
691 string value;
692 DO(ConsumeIdentifier(&value));
693 if (value == "true" || value == "True" || value == "t") {
694 SET_FIELD(Bool, true);
695 } else if (value == "false" || value == "False" || value == "f") {
696 SET_FIELD(Bool, false);
697 } else {
698 ReportError("Invalid value for boolean field \"" + field->name()
699 + "\". Value: \"" + value + "\".");
700 return false;
701 }
702 }
703 break;
704 }
705
706 case FieldDescriptor::CPPTYPE_ENUM: {
707 string value;
708 const EnumDescriptor* enum_type = field->enum_type();
709 const EnumValueDescriptor* enum_value = NULL;
710
711 if (LookingAtType(io::Tokenizer::TYPE_IDENTIFIER)) {
712 DO(ConsumeIdentifier(&value));
713 // Find the enumeration value.
714 enum_value = enum_type->FindValueByName(value);
715
716 } else if (LookingAt("-") ||
717 LookingAtType(io::Tokenizer::TYPE_INTEGER)) {
718 int64 int_value;
719 DO(ConsumeSignedInteger(&int_value, kint32max));
720 value = SimpleItoa(int_value); // for error reporting
721 enum_value = enum_type->FindValueByNumber(int_value);
722 } else {
723 ReportError("Expected integer or identifier, got: " +
724 tokenizer_.current().text);
725 return false;
726 }
727
728 if (enum_value == NULL) {
729 if (!allow_unknown_enum_) {
730 ReportError("Unknown enumeration value of \"" + value + "\" for "
731 "field \"" + field->name() + "\".");
732 return false;
733 } else {
734 ReportWarning("Unknown enumeration value of \"" + value + "\" for "
735 "field \"" + field->name() + "\".");
736 return true;
737 }
738 }
739
740 SET_FIELD(Enum, enum_value);
741 break;
742 }
743
744 case FieldDescriptor::CPPTYPE_MESSAGE: {
745 // We should never get here. Put here instead of a default
746 // so that if new types are added, we get a nice compiler warning.
747 GOOGLE_LOG(FATAL) << "Reached an unintended state: CPPTYPE_MESSAGE";
748 break;
749 }
750 }
751 #undef SET_FIELD
752 return true;
753 }
754
SkipFieldValue()755 bool SkipFieldValue() {
756 if (LookingAtType(io::Tokenizer::TYPE_STRING)) {
757 while (LookingAtType(io::Tokenizer::TYPE_STRING)) {
758 tokenizer_.Next();
759 }
760 return true;
761 }
762 if (TryConsume("[")) {
763 while (true) {
764 if (!LookingAt("{") && !LookingAt("<")) {
765 DO(SkipFieldValue());
766 } else {
767 DO(SkipFieldMessage());
768 }
769 if (TryConsume("]")) {
770 break;
771 }
772 DO(Consume(","));
773 }
774 return true;
775 }
776 // Possible field values other than string:
777 // 12345 => TYPE_INTEGER
778 // -12345 => TYPE_SYMBOL + TYPE_INTEGER
779 // 1.2345 => TYPE_FLOAT
780 // -1.2345 => TYPE_SYMBOL + TYPE_FLOAT
781 // inf => TYPE_IDENTIFIER
782 // -inf => TYPE_SYMBOL + TYPE_IDENTIFIER
783 // TYPE_INTEGER => TYPE_IDENTIFIER
784 // Divides them into two group, one with TYPE_SYMBOL
785 // and the other without:
786 // Group one:
787 // 12345 => TYPE_INTEGER
788 // 1.2345 => TYPE_FLOAT
789 // inf => TYPE_IDENTIFIER
790 // TYPE_INTEGER => TYPE_IDENTIFIER
791 // Group two:
792 // -12345 => TYPE_SYMBOL + TYPE_INTEGER
793 // -1.2345 => TYPE_SYMBOL + TYPE_FLOAT
794 // -inf => TYPE_SYMBOL + TYPE_IDENTIFIER
795 // As we can see, the field value consists of an optional '-' and one of
796 // TYPE_INTEGER, TYPE_FLOAT and TYPE_IDENTIFIER.
797 bool has_minus = TryConsume("-");
798 if (!LookingAtType(io::Tokenizer::TYPE_INTEGER) &&
799 !LookingAtType(io::Tokenizer::TYPE_FLOAT) &&
800 !LookingAtType(io::Tokenizer::TYPE_IDENTIFIER)) {
801 return false;
802 }
803 // Combination of '-' and TYPE_IDENTIFIER may result in an invalid field
804 // value while other combinations all generate valid values.
805 // We check if the value of this combination is valid here.
806 // TYPE_IDENTIFIER after a '-' should be one of the float values listed
807 // below:
808 // inf, inff, infinity, nan
809 if (has_minus && LookingAtType(io::Tokenizer::TYPE_IDENTIFIER)) {
810 string text = tokenizer_.current().text;
811 LowerString(&text);
812 if (text != "inf" &&
813 text != "infinity" &&
814 text != "nan") {
815 ReportError("Invalid float number: " + text);
816 return false;
817 }
818 }
819 tokenizer_.Next();
820 return true;
821 }
822
823 // Returns true if the current token's text is equal to that specified.
LookingAt(const string & text)824 bool LookingAt(const string& text) {
825 return tokenizer_.current().text == text;
826 }
827
828 // Returns true if the current token's type is equal to that specified.
LookingAtType(io::Tokenizer::TokenType token_type)829 bool LookingAtType(io::Tokenizer::TokenType token_type) {
830 return tokenizer_.current().type == token_type;
831 }
832
833 // Consumes an identifier and saves its value in the identifier parameter.
834 // Returns false if the token is not of type IDENTFIER.
ConsumeIdentifier(string * identifier)835 bool ConsumeIdentifier(string* identifier) {
836 if (LookingAtType(io::Tokenizer::TYPE_IDENTIFIER)) {
837 *identifier = tokenizer_.current().text;
838 tokenizer_.Next();
839 return true;
840 }
841
842 // If allow_field_numer_ or allow_unknown_field_ is true, we should able
843 // to parse integer identifiers.
844 if ((allow_field_number_ || allow_unknown_field_)
845 && LookingAtType(io::Tokenizer::TYPE_INTEGER)) {
846 *identifier = tokenizer_.current().text;
847 tokenizer_.Next();
848 return true;
849 }
850
851 ReportError("Expected identifier, got: " + tokenizer_.current().text);
852 return false;
853 }
854
855 // Consume a string of form "<id1>.<id2>....<idN>".
ConsumeFullTypeName(string * name)856 bool ConsumeFullTypeName(string* name) {
857 DO(ConsumeIdentifier(name));
858 while (TryConsume(".")) {
859 string part;
860 DO(ConsumeIdentifier(&part));
861 *name += ".";
862 *name += part;
863 }
864 return true;
865 }
866
867 // Consumes a string and saves its value in the text parameter.
868 // Returns false if the token is not of type STRING.
ConsumeString(string * text)869 bool ConsumeString(string* text) {
870 if (!LookingAtType(io::Tokenizer::TYPE_STRING)) {
871 ReportError("Expected string, got: " + tokenizer_.current().text);
872 return false;
873 }
874
875 text->clear();
876 while (LookingAtType(io::Tokenizer::TYPE_STRING)) {
877 io::Tokenizer::ParseStringAppend(tokenizer_.current().text, text);
878
879 tokenizer_.Next();
880 }
881
882 return true;
883 }
884
885 // Consumes a uint64 and saves its value in the value parameter.
886 // Returns false if the token is not of type INTEGER.
ConsumeUnsignedInteger(uint64 * value,uint64 max_value)887 bool ConsumeUnsignedInteger(uint64* value, uint64 max_value) {
888 if (!LookingAtType(io::Tokenizer::TYPE_INTEGER)) {
889 ReportError("Expected integer, got: " + tokenizer_.current().text);
890 return false;
891 }
892
893 if (!io::Tokenizer::ParseInteger(tokenizer_.current().text,
894 max_value, value)) {
895 ReportError("Integer out of range (" + tokenizer_.current().text + ")");
896 return false;
897 }
898
899 tokenizer_.Next();
900 return true;
901 }
902
903 // Consumes an int64 and saves its value in the value parameter.
904 // Note that since the tokenizer does not support negative numbers,
905 // we actually may consume an additional token (for the minus sign) in this
906 // method. Returns false if the token is not an integer
907 // (signed or otherwise).
ConsumeSignedInteger(int64 * value,uint64 max_value)908 bool ConsumeSignedInteger(int64* value, uint64 max_value) {
909 bool negative = false;
910
911 if (TryConsume("-")) {
912 negative = true;
913 // Two's complement always allows one more negative integer than
914 // positive.
915 ++max_value;
916 }
917
918 uint64 unsigned_value;
919
920 DO(ConsumeUnsignedInteger(&unsigned_value, max_value));
921
922 if (negative) {
923 if ((static_cast<uint64>(kint64max) + 1) == unsigned_value) {
924 *value = kint64min;
925 } else {
926 *value = -static_cast<int64>(unsigned_value);
927 }
928 } else {
929 *value = static_cast<int64>(unsigned_value);
930 }
931
932 return true;
933 }
934
935 // Consumes a uint64 and saves its value in the value parameter.
936 // Accepts decimal numbers only, rejects hex or oct numbers.
ConsumeUnsignedDecimalInteger(uint64 * value,uint64 max_value)937 bool ConsumeUnsignedDecimalInteger(uint64* value, uint64 max_value) {
938 if (!LookingAtType(io::Tokenizer::TYPE_INTEGER)) {
939 ReportError("Expected integer, got: " + tokenizer_.current().text);
940 return false;
941 }
942
943 const string& text = tokenizer_.current().text;
944 if (IsHexNumber(text) || IsOctNumber(text)) {
945 ReportError("Expect a decimal number, got: " + text);
946 return false;
947 }
948
949 if (!io::Tokenizer::ParseInteger(text, max_value, value)) {
950 ReportError("Integer out of range (" + text + ")");
951 return false;
952 }
953
954 tokenizer_.Next();
955 return true;
956 }
957
958 // Consumes a double and saves its value in the value parameter.
959 // Note that since the tokenizer does not support negative numbers,
960 // we actually may consume an additional token (for the minus sign) in this
961 // method. Returns false if the token is not a double
962 // (signed or otherwise).
ConsumeDouble(double * value)963 bool ConsumeDouble(double* value) {
964 bool negative = false;
965
966 if (TryConsume("-")) {
967 negative = true;
968 }
969
970 // A double can actually be an integer, according to the tokenizer.
971 // Therefore, we must check both cases here.
972 if (LookingAtType(io::Tokenizer::TYPE_INTEGER)) {
973 // We have found an integer value for the double.
974 uint64 integer_value;
975 DO(ConsumeUnsignedDecimalInteger(&integer_value, kuint64max));
976
977 *value = static_cast<double>(integer_value);
978 } else if (LookingAtType(io::Tokenizer::TYPE_FLOAT)) {
979 // We have found a float value for the double.
980 *value = io::Tokenizer::ParseFloat(tokenizer_.current().text);
981
982 // Mark the current token as consumed.
983 tokenizer_.Next();
984 } else if (LookingAtType(io::Tokenizer::TYPE_IDENTIFIER)) {
985 string text = tokenizer_.current().text;
986 LowerString(&text);
987 if (text == "inf" ||
988 text == "infinity") {
989 *value = std::numeric_limits<double>::infinity();
990 tokenizer_.Next();
991 } else if (text == "nan") {
992 *value = std::numeric_limits<double>::quiet_NaN();
993 tokenizer_.Next();
994 } else {
995 ReportError("Expected double, got: " + text);
996 return false;
997 }
998 } else {
999 ReportError("Expected double, got: " + tokenizer_.current().text);
1000 return false;
1001 }
1002
1003 if (negative) {
1004 *value = -*value;
1005 }
1006
1007 return true;
1008 }
1009
1010 // Consumes Any::type_url value, of form "type.googleapis.com/full.type.Name"
1011 // or "type.googleprod.com/full.type.Name"
ConsumeAnyTypeUrl(string * full_type_name,string * prefix)1012 bool ConsumeAnyTypeUrl(string* full_type_name, string* prefix) {
1013 // TODO(saito) Extend Consume() to consume multiple tokens at once, so that
1014 // this code can be written as just DO(Consume(kGoogleApisTypePrefix)).
1015 string url1, url2, url3;
1016 DO(ConsumeIdentifier(&url1)); // type
1017 DO(Consume("."));
1018 DO(ConsumeIdentifier(&url2)); // googleapis
1019 DO(Consume("."));
1020 DO(ConsumeIdentifier(&url3)); // com
1021 DO(Consume("/"));
1022 DO(ConsumeFullTypeName(full_type_name));
1023
1024 *prefix = url1 + "." + url2 + "." + url3 + "/";
1025 if (*prefix != internal::kTypeGoogleApisComPrefix &&
1026 *prefix != internal::kTypeGoogleProdComPrefix) {
1027 ReportError("TextFormat::Parser for Any supports only "
1028 "type.googleapis.com and type.googleprod.com, "
1029 "but found \"" + *prefix + "\"");
1030 return false;
1031 }
1032 return true;
1033 }
1034
1035 // A helper function for reconstructing Any::value. Consumes a text of
1036 // full_type_name, then serializes it into serialized_value. "pool" is used to
1037 // look up and create a temporary object with full_type_name.
ConsumeAnyValue(const string & full_type_name,const DescriptorPool * pool,string * serialized_value)1038 bool ConsumeAnyValue(const string& full_type_name, const DescriptorPool* pool,
1039 string* serialized_value) {
1040 const Descriptor* value_descriptor =
1041 pool->FindMessageTypeByName(full_type_name);
1042 if (value_descriptor == NULL) {
1043 ReportError("Could not find type \"" + full_type_name +
1044 "\" stored in google.protobuf.Any.");
1045 return false;
1046 }
1047 DynamicMessageFactory factory;
1048 const Message* value_prototype = factory.GetPrototype(value_descriptor);
1049 if (value_prototype == NULL) {
1050 return false;
1051 }
1052 google::protobuf::scoped_ptr<Message> value(value_prototype->New());
1053 string sub_delimiter;
1054 DO(ConsumeMessageDelimiter(&sub_delimiter));
1055 DO(ConsumeMessage(value.get(), sub_delimiter));
1056
1057 if (allow_partial_) {
1058 value->AppendPartialToString(serialized_value);
1059 } else {
1060 if (!value->IsInitialized()) {
1061 ReportError(
1062 "Value of type \"" + full_type_name +
1063 "\" stored in google.protobuf.Any has missing required fields");
1064 return false;
1065 }
1066 value->AppendToString(serialized_value);
1067 }
1068 return true;
1069 }
1070
1071 // Consumes a token and confirms that it matches that specified in the
1072 // value parameter. Returns false if the token found does not match that
1073 // which was specified.
Consume(const string & value)1074 bool Consume(const string& value) {
1075 const string& current_value = tokenizer_.current().text;
1076
1077 if (current_value != value) {
1078 ReportError("Expected \"" + value + "\", found \"" + current_value
1079 + "\".");
1080 return false;
1081 }
1082
1083 tokenizer_.Next();
1084
1085 return true;
1086 }
1087
1088 // Attempts to consume the supplied value. Returns false if a the
1089 // token found does not match the value specified.
TryConsume(const string & value)1090 bool TryConsume(const string& value) {
1091 if (tokenizer_.current().text == value) {
1092 tokenizer_.Next();
1093 return true;
1094 } else {
1095 return false;
1096 }
1097 }
1098
1099 // An internal instance of the Tokenizer's error collector, used to
1100 // collect any base-level parse errors and feed them to the ParserImpl.
1101 class ParserErrorCollector : public io::ErrorCollector {
1102 public:
ParserErrorCollector(TextFormat::Parser::ParserImpl * parser)1103 explicit ParserErrorCollector(TextFormat::Parser::ParserImpl* parser) :
1104 parser_(parser) { }
1105
~ParserErrorCollector()1106 virtual ~ParserErrorCollector() { }
1107
AddError(int line,int column,const string & message)1108 virtual void AddError(int line, int column, const string& message) {
1109 parser_->ReportError(line, column, message);
1110 }
1111
AddWarning(int line,int column,const string & message)1112 virtual void AddWarning(int line, int column, const string& message) {
1113 parser_->ReportWarning(line, column, message);
1114 }
1115
1116 private:
1117 GOOGLE_DISALLOW_EVIL_CONSTRUCTORS(ParserErrorCollector);
1118 TextFormat::Parser::ParserImpl* parser_;
1119 };
1120
1121 io::ErrorCollector* error_collector_;
1122 TextFormat::Finder* finder_;
1123 ParseInfoTree* parse_info_tree_;
1124 ParserErrorCollector tokenizer_error_collector_;
1125 io::Tokenizer tokenizer_;
1126 const Descriptor* root_message_type_;
1127 SingularOverwritePolicy singular_overwrite_policy_;
1128 const bool allow_case_insensitive_field_;
1129 const bool allow_unknown_field_;
1130 const bool allow_unknown_enum_;
1131 const bool allow_field_number_;
1132 const bool allow_partial_;
1133 bool had_errors_;
1134 };
1135
1136 #undef DO
1137
1138 // ===========================================================================
1139 // Internal class for writing text to the io::ZeroCopyOutputStream. Adapted
1140 // from the Printer found in //google/protobuf/io/printer.h
1141 class TextFormat::Printer::TextGenerator {
1142 public:
TextGenerator(io::ZeroCopyOutputStream * output,int initial_indent_level)1143 explicit TextGenerator(io::ZeroCopyOutputStream* output,
1144 int initial_indent_level)
1145 : output_(output),
1146 buffer_(NULL),
1147 buffer_size_(0),
1148 at_start_of_line_(true),
1149 failed_(false),
1150 indent_(""),
1151 initial_indent_level_(initial_indent_level) {
1152 indent_.resize(initial_indent_level_ * 2, ' ');
1153 }
1154
~TextGenerator()1155 ~TextGenerator() {
1156 // Only BackUp() if we're sure we've successfully called Next() at least
1157 // once.
1158 if (!failed_ && buffer_size_ > 0) {
1159 output_->BackUp(buffer_size_);
1160 }
1161 }
1162
1163 // Indent text by two spaces. After calling Indent(), two spaces will be
1164 // inserted at the beginning of each line of text. Indent() may be called
1165 // multiple times to produce deeper indents.
Indent()1166 void Indent() {
1167 indent_ += " ";
1168 }
1169
1170 // Reduces the current indent level by two spaces, or crashes if the indent
1171 // level is zero.
Outdent()1172 void Outdent() {
1173 if (indent_.empty() ||
1174 indent_.size() < initial_indent_level_ * 2) {
1175 GOOGLE_LOG(DFATAL) << " Outdent() without matching Indent().";
1176 return;
1177 }
1178
1179 indent_.resize(indent_.size() - 2);
1180 }
1181
1182 // Print text to the output stream.
Print(const string & str)1183 void Print(const string& str) {
1184 Print(str.data(), str.size());
1185 }
1186
1187 // Print text to the output stream.
Print(const char * text)1188 void Print(const char* text) {
1189 Print(text, strlen(text));
1190 }
1191
1192 // Print text to the output stream.
Print(const char * text,size_t size)1193 void Print(const char* text, size_t size) {
1194 size_t pos = 0; // The number of bytes we've written so far.
1195
1196 for (size_t i = 0; i < size; i++) {
1197 if (text[i] == '\n') {
1198 // Saw newline. If there is more text, we may need to insert an indent
1199 // here. So, write what we have so far, including the '\n'.
1200 Write(text + pos, i - pos + 1);
1201 pos = i + 1;
1202
1203 // Setting this true will cause the next Write() to insert an indent
1204 // first.
1205 at_start_of_line_ = true;
1206 }
1207 }
1208
1209 // Write the rest.
1210 Write(text + pos, size - pos);
1211 }
1212
1213 // True if any write to the underlying stream failed. (We don't just
1214 // crash in this case because this is an I/O failure, not a programming
1215 // error.)
failed() const1216 bool failed() const { return failed_; }
1217
1218 private:
1219 GOOGLE_DISALLOW_EVIL_CONSTRUCTORS(TextGenerator);
1220
Write(const char * data,size_t size)1221 void Write(const char* data, size_t size) {
1222 if (failed_) return;
1223 if (size == 0) return;
1224
1225 if (at_start_of_line_) {
1226 // Insert an indent.
1227 at_start_of_line_ = false;
1228 Write(indent_.data(), indent_.size());
1229 if (failed_) return;
1230 }
1231
1232 while (size > buffer_size_) {
1233 // Data exceeds space in the buffer. Copy what we can and request a
1234 // new buffer.
1235 memcpy(buffer_, data, buffer_size_);
1236 data += buffer_size_;
1237 size -= buffer_size_;
1238 void* void_buffer;
1239 failed_ = !output_->Next(&void_buffer, &buffer_size_);
1240 if (failed_) return;
1241 buffer_ = reinterpret_cast<char*>(void_buffer);
1242 }
1243
1244 // Buffer is big enough to receive the data; copy it.
1245 memcpy(buffer_, data, size);
1246 buffer_ += size;
1247 buffer_size_ -= size;
1248 }
1249
1250 io::ZeroCopyOutputStream* const output_;
1251 char* buffer_;
1252 int buffer_size_;
1253 bool at_start_of_line_;
1254 bool failed_;
1255
1256 string indent_;
1257 int initial_indent_level_;
1258 };
1259
1260 // ===========================================================================
1261
~Finder()1262 TextFormat::Finder::~Finder() {
1263 }
1264
Parser()1265 TextFormat::Parser::Parser()
1266 : error_collector_(NULL),
1267 finder_(NULL),
1268 parse_info_tree_(NULL),
1269 allow_partial_(false),
1270 allow_case_insensitive_field_(false),
1271 allow_unknown_field_(false),
1272 allow_unknown_enum_(false),
1273 allow_field_number_(false),
1274 allow_relaxed_whitespace_(false),
1275 allow_singular_overwrites_(false) {
1276 }
1277
~Parser()1278 TextFormat::Parser::~Parser() {}
1279
Parse(io::ZeroCopyInputStream * input,Message * output)1280 bool TextFormat::Parser::Parse(io::ZeroCopyInputStream* input,
1281 Message* output) {
1282 output->Clear();
1283
1284 ParserImpl::SingularOverwritePolicy overwrites_policy =
1285 allow_singular_overwrites_
1286 ? ParserImpl::ALLOW_SINGULAR_OVERWRITES
1287 : ParserImpl::FORBID_SINGULAR_OVERWRITES;
1288
1289 ParserImpl parser(output->GetDescriptor(), input, error_collector_,
1290 finder_, parse_info_tree_,
1291 overwrites_policy,
1292 allow_case_insensitive_field_, allow_unknown_field_,
1293 allow_unknown_enum_, allow_field_number_,
1294 allow_relaxed_whitespace_, allow_partial_);
1295 return MergeUsingImpl(input, output, &parser);
1296 }
1297
ParseFromString(const string & input,Message * output)1298 bool TextFormat::Parser::ParseFromString(const string& input,
1299 Message* output) {
1300 io::ArrayInputStream input_stream(input.data(), input.size());
1301 return Parse(&input_stream, output);
1302 }
1303
Merge(io::ZeroCopyInputStream * input,Message * output)1304 bool TextFormat::Parser::Merge(io::ZeroCopyInputStream* input,
1305 Message* output) {
1306 ParserImpl parser(output->GetDescriptor(), input, error_collector_,
1307 finder_, parse_info_tree_,
1308 ParserImpl::ALLOW_SINGULAR_OVERWRITES,
1309 allow_case_insensitive_field_, allow_unknown_field_,
1310 allow_unknown_enum_, allow_field_number_,
1311 allow_relaxed_whitespace_, allow_partial_);
1312 return MergeUsingImpl(input, output, &parser);
1313 }
1314
MergeFromString(const string & input,Message * output)1315 bool TextFormat::Parser::MergeFromString(const string& input,
1316 Message* output) {
1317 io::ArrayInputStream input_stream(input.data(), input.size());
1318 return Merge(&input_stream, output);
1319 }
1320
MergeUsingImpl(io::ZeroCopyInputStream *,Message * output,ParserImpl * parser_impl)1321 bool TextFormat::Parser::MergeUsingImpl(io::ZeroCopyInputStream* /* input */,
1322 Message* output,
1323 ParserImpl* parser_impl) {
1324 if (!parser_impl->Parse(output)) return false;
1325 if (!allow_partial_ && !output->IsInitialized()) {
1326 vector<string> missing_fields;
1327 output->FindInitializationErrors(&missing_fields);
1328 parser_impl->ReportError(-1, 0, "Message missing required fields: " +
1329 Join(missing_fields, ", "));
1330 return false;
1331 }
1332 return true;
1333 }
1334
ParseFieldValueFromString(const string & input,const FieldDescriptor * field,Message * output)1335 bool TextFormat::Parser::ParseFieldValueFromString(
1336 const string& input,
1337 const FieldDescriptor* field,
1338 Message* output) {
1339 io::ArrayInputStream input_stream(input.data(), input.size());
1340 ParserImpl parser(output->GetDescriptor(), &input_stream, error_collector_,
1341 finder_, parse_info_tree_,
1342 ParserImpl::ALLOW_SINGULAR_OVERWRITES,
1343 allow_case_insensitive_field_, allow_unknown_field_,
1344 allow_unknown_enum_, allow_field_number_,
1345 allow_relaxed_whitespace_, allow_partial_);
1346 return parser.ParseField(field, output);
1347 }
1348
Parse(io::ZeroCopyInputStream * input,Message * output)1349 /* static */ bool TextFormat::Parse(io::ZeroCopyInputStream* input,
1350 Message* output) {
1351 return Parser().Parse(input, output);
1352 }
1353
Merge(io::ZeroCopyInputStream * input,Message * output)1354 /* static */ bool TextFormat::Merge(io::ZeroCopyInputStream* input,
1355 Message* output) {
1356 return Parser().Merge(input, output);
1357 }
1358
ParseFromString(const string & input,Message * output)1359 /* static */ bool TextFormat::ParseFromString(const string& input,
1360 Message* output) {
1361 return Parser().ParseFromString(input, output);
1362 }
1363
MergeFromString(const string & input,Message * output)1364 /* static */ bool TextFormat::MergeFromString(const string& input,
1365 Message* output) {
1366 return Parser().MergeFromString(input, output);
1367 }
1368
1369 // ===========================================================================
1370
1371 // The default implementation for FieldValuePrinter. The base class just
1372 // does simple formatting. That way, deriving classes could decide to fallback
1373 // to that behavior.
FieldValuePrinter()1374 TextFormat::FieldValuePrinter::FieldValuePrinter() {}
~FieldValuePrinter()1375 TextFormat::FieldValuePrinter::~FieldValuePrinter() {}
PrintBool(bool val) const1376 string TextFormat::FieldValuePrinter::PrintBool(bool val) const {
1377 return val ? "true" : "false";
1378 }
PrintInt32(int32 val) const1379 string TextFormat::FieldValuePrinter::PrintInt32(int32 val) const {
1380 return SimpleItoa(val);
1381 }
PrintUInt32(uint32 val) const1382 string TextFormat::FieldValuePrinter::PrintUInt32(uint32 val) const {
1383 return SimpleItoa(val);
1384 }
PrintInt64(int64 val) const1385 string TextFormat::FieldValuePrinter::PrintInt64(int64 val) const {
1386 return SimpleItoa(val);
1387 }
PrintUInt64(uint64 val) const1388 string TextFormat::FieldValuePrinter::PrintUInt64(uint64 val) const {
1389 return SimpleItoa(val);
1390 }
PrintFloat(float val) const1391 string TextFormat::FieldValuePrinter::PrintFloat(float val) const {
1392 return SimpleFtoa(val);
1393 }
PrintDouble(double val) const1394 string TextFormat::FieldValuePrinter::PrintDouble(double val) const {
1395 return SimpleDtoa(val);
1396 }
PrintString(const string & val) const1397 string TextFormat::FieldValuePrinter::PrintString(const string& val) const {
1398 string printed("\"");
1399 CEscapeAndAppend(val, &printed);
1400 printed.push_back('\"');
1401 return printed;
1402 }
PrintBytes(const string & val) const1403 string TextFormat::FieldValuePrinter::PrintBytes(const string& val) const {
1404 return PrintString(val);
1405 }
PrintEnum(int32 val,const string & name) const1406 string TextFormat::FieldValuePrinter::PrintEnum(int32 val,
1407 const string& name) const {
1408 return name;
1409 }
PrintFieldName(const Message & message,const Reflection * reflection,const FieldDescriptor * field) const1410 string TextFormat::FieldValuePrinter::PrintFieldName(
1411 const Message& message,
1412 const Reflection* reflection,
1413 const FieldDescriptor* field) const {
1414 if (field->is_extension()) {
1415 // We special-case MessageSet elements for compatibility with proto1.
1416 if (field->containing_type()->options().message_set_wire_format()
1417 && field->type() == FieldDescriptor::TYPE_MESSAGE
1418 && field->is_optional()
1419 && field->extension_scope() == field->message_type()) {
1420 return StrCat("[", field->message_type()->full_name(), "]");
1421 } else {
1422 return StrCat("[", field->full_name(), "]");
1423 }
1424 } else if (field->type() == FieldDescriptor::TYPE_GROUP) {
1425 // Groups must be serialized with their original capitalization.
1426 return field->message_type()->name();
1427 } else {
1428 return field->name();
1429 }
1430 }
PrintMessageStart(const Message & message,int field_index,int field_count,bool single_line_mode) const1431 string TextFormat::FieldValuePrinter::PrintMessageStart(
1432 const Message& message,
1433 int field_index,
1434 int field_count,
1435 bool single_line_mode) const {
1436 return single_line_mode ? " { " : " {\n";
1437 }
PrintMessageEnd(const Message & message,int field_index,int field_count,bool single_line_mode) const1438 string TextFormat::FieldValuePrinter::PrintMessageEnd(
1439 const Message& message,
1440 int field_index,
1441 int field_count,
1442 bool single_line_mode) const {
1443 return single_line_mode ? "} " : "}\n";
1444 }
1445
1446 namespace {
1447 // Our own specialization: for UTF8 escaped strings.
1448 class FieldValuePrinterUtf8Escaping : public TextFormat::FieldValuePrinter {
1449 public:
PrintString(const string & val) const1450 virtual string PrintString(const string& val) const {
1451 return StrCat("\"", strings::Utf8SafeCEscape(val), "\"");
1452 }
PrintBytes(const string & val) const1453 virtual string PrintBytes(const string& val) const {
1454 return TextFormat::FieldValuePrinter::PrintString(val);
1455 }
1456 };
1457
1458 } // namespace
1459
Printer()1460 TextFormat::Printer::Printer()
1461 : initial_indent_level_(0),
1462 single_line_mode_(false),
1463 use_field_number_(false),
1464 use_short_repeated_primitives_(false),
1465 hide_unknown_fields_(false),
1466 print_message_fields_in_index_order_(false),
1467 expand_any_(false),
1468 truncate_string_field_longer_than_(0LL) {
1469 SetUseUtf8StringEscaping(false);
1470 }
1471
~Printer()1472 TextFormat::Printer::~Printer() {
1473 STLDeleteValues(&custom_printers_);
1474 }
1475
SetUseUtf8StringEscaping(bool as_utf8)1476 void TextFormat::Printer::SetUseUtf8StringEscaping(bool as_utf8) {
1477 SetDefaultFieldValuePrinter(as_utf8
1478 ? new FieldValuePrinterUtf8Escaping()
1479 : new FieldValuePrinter());
1480 }
1481
SetDefaultFieldValuePrinter(const FieldValuePrinter * printer)1482 void TextFormat::Printer::SetDefaultFieldValuePrinter(
1483 const FieldValuePrinter* printer) {
1484 default_field_value_printer_.reset(printer);
1485 }
1486
RegisterFieldValuePrinter(const FieldDescriptor * field,const FieldValuePrinter * printer)1487 bool TextFormat::Printer::RegisterFieldValuePrinter(
1488 const FieldDescriptor* field,
1489 const FieldValuePrinter* printer) {
1490 return field != NULL && printer != NULL &&
1491 custom_printers_.insert(std::make_pair(field, printer)).second;
1492 }
1493
PrintToString(const Message & message,string * output) const1494 bool TextFormat::Printer::PrintToString(const Message& message,
1495 string* output) const {
1496 GOOGLE_DCHECK(output) << "output specified is NULL";
1497
1498 output->clear();
1499 io::StringOutputStream output_stream(output);
1500
1501 return Print(message, &output_stream);
1502 }
1503
PrintUnknownFieldsToString(const UnknownFieldSet & unknown_fields,string * output) const1504 bool TextFormat::Printer::PrintUnknownFieldsToString(
1505 const UnknownFieldSet& unknown_fields,
1506 string* output) const {
1507 GOOGLE_DCHECK(output) << "output specified is NULL";
1508
1509 output->clear();
1510 io::StringOutputStream output_stream(output);
1511 return PrintUnknownFields(unknown_fields, &output_stream);
1512 }
1513
Print(const Message & message,io::ZeroCopyOutputStream * output) const1514 bool TextFormat::Printer::Print(const Message& message,
1515 io::ZeroCopyOutputStream* output) const {
1516 TextGenerator generator(output, initial_indent_level_);
1517
1518 Print(message, generator);
1519
1520 // Output false if the generator failed internally.
1521 return !generator.failed();
1522 }
1523
PrintUnknownFields(const UnknownFieldSet & unknown_fields,io::ZeroCopyOutputStream * output) const1524 bool TextFormat::Printer::PrintUnknownFields(
1525 const UnknownFieldSet& unknown_fields,
1526 io::ZeroCopyOutputStream* output) const {
1527 TextGenerator generator(output, initial_indent_level_);
1528
1529 PrintUnknownFields(unknown_fields, generator);
1530
1531 // Output false if the generator failed internally.
1532 return !generator.failed();
1533 }
1534
1535 namespace {
1536 // Comparison functor for sorting FieldDescriptors by field index.
1537 struct FieldIndexSorter {
operator ()google::protobuf::__anonb10ba4750311::FieldIndexSorter1538 bool operator()(const FieldDescriptor* left,
1539 const FieldDescriptor* right) const {
1540 return left->index() < right->index();
1541 }
1542 };
1543
1544 } // namespace
1545
PrintAny(const Message & message,TextGenerator & generator) const1546 bool TextFormat::Printer::PrintAny(const Message& message,
1547 TextGenerator& generator) const {
1548 const FieldDescriptor* type_url_field;
1549 const FieldDescriptor* value_field;
1550 if (!internal::GetAnyFieldDescriptors(message, &type_url_field,
1551 &value_field)) {
1552 return false;
1553 }
1554
1555 const Reflection* reflection = message.GetReflection();
1556
1557 // Extract the full type name from the type_url field.
1558 const string& type_url = reflection->GetString(message, type_url_field);
1559 string full_type_name;
1560 if (!internal::ParseAnyTypeUrl(type_url, &full_type_name)) {
1561 return false;
1562 }
1563
1564 // Print the "value" in text.
1565 const google::protobuf::Descriptor* value_descriptor =
1566 message.GetDescriptor()->file()->pool()->FindMessageTypeByName(
1567 full_type_name);
1568 if (value_descriptor == NULL) {
1569 GOOGLE_LOG(WARNING) << "Proto type " << type_url << " not found";
1570 return false;
1571 }
1572 DynamicMessageFactory factory;
1573 google::protobuf::scoped_ptr<google::protobuf::Message> value_message(
1574 factory.GetPrototype(value_descriptor)->New());
1575 string serialized_value = reflection->GetString(message, value_field);
1576 if (!value_message->ParseFromString(serialized_value)) {
1577 GOOGLE_LOG(WARNING) << type_url << ": failed to parse contents";
1578 return false;
1579 }
1580 generator.Print(StrCat("[", type_url, "]"));
1581 const FieldValuePrinter* printer = FindWithDefault(
1582 custom_printers_, value_field, default_field_value_printer_.get());
1583 generator.Print(
1584 printer->PrintMessageStart(message, -1, 0, single_line_mode_));
1585 generator.Indent();
1586 Print(*value_message, generator);
1587 generator.Outdent();
1588 generator.Print(printer->PrintMessageEnd(message, -1, 0, single_line_mode_));
1589 return true;
1590 }
1591
Print(const Message & message,TextGenerator & generator) const1592 void TextFormat::Printer::Print(const Message& message,
1593 TextGenerator& generator) const {
1594 const Descriptor* descriptor = message.GetDescriptor();
1595 const Reflection* reflection = message.GetReflection();
1596 if (descriptor->full_name() == internal::kAnyFullTypeName && expand_any_ &&
1597 PrintAny(message, generator)) {
1598 return;
1599 }
1600 vector<const FieldDescriptor*> fields;
1601 reflection->ListFields(message, &fields);
1602 if (print_message_fields_in_index_order_) {
1603 std::sort(fields.begin(), fields.end(), FieldIndexSorter());
1604 }
1605 for (int i = 0; i < fields.size(); i++) {
1606 PrintField(message, reflection, fields[i], generator);
1607 }
1608 if (!hide_unknown_fields_) {
1609 PrintUnknownFields(reflection->GetUnknownFields(message), generator);
1610 }
1611 }
1612
PrintFieldValueToString(const Message & message,const FieldDescriptor * field,int index,string * output) const1613 void TextFormat::Printer::PrintFieldValueToString(
1614 const Message& message,
1615 const FieldDescriptor* field,
1616 int index,
1617 string* output) const {
1618
1619 GOOGLE_DCHECK(output) << "output specified is NULL";
1620
1621 output->clear();
1622 io::StringOutputStream output_stream(output);
1623 TextGenerator generator(&output_stream, initial_indent_level_);
1624
1625 PrintFieldValue(message, message.GetReflection(), field, index, generator);
1626 }
1627
1628 class MapEntryMessageComparator {
1629 public:
MapEntryMessageComparator(const Descriptor * descriptor)1630 explicit MapEntryMessageComparator(const Descriptor* descriptor)
1631 : field_(descriptor->field(0)) {}
1632
operator ()(const Message * a,const Message * b)1633 bool operator()(const Message* a, const Message* b) {
1634 const Reflection* reflection = a->GetReflection();
1635 switch (field_->cpp_type()) {
1636 case FieldDescriptor::CPPTYPE_BOOL: {
1637 bool first = reflection->GetBool(*a, field_);
1638 bool second = reflection->GetBool(*b, field_);
1639 return first < second;
1640 }
1641 case FieldDescriptor::CPPTYPE_INT32: {
1642 int32 first = reflection->GetInt32(*a, field_);
1643 int32 second = reflection->GetInt32(*b, field_);
1644 return first < second;
1645 }
1646 case FieldDescriptor::CPPTYPE_INT64: {
1647 int64 first = reflection->GetInt64(*a, field_);
1648 int64 second = reflection->GetInt64(*b, field_);
1649 return first < second;
1650 }
1651 case FieldDescriptor::CPPTYPE_UINT32: {
1652 uint32 first = reflection->GetUInt32(*a, field_);
1653 uint32 second = reflection->GetUInt32(*b, field_);
1654 return first < second;
1655 }
1656 case FieldDescriptor::CPPTYPE_UINT64: {
1657 uint64 first = reflection->GetUInt64(*a, field_);
1658 uint64 second = reflection->GetUInt64(*b, field_);
1659 return first < second;
1660 }
1661 case FieldDescriptor::CPPTYPE_STRING: {
1662 string first = reflection->GetString(*a, field_);
1663 string second = reflection->GetString(*b, field_);
1664 return first < second;
1665 }
1666 default:
1667 GOOGLE_LOG(DFATAL) << "Invalid key for map field.";
1668 return true;
1669 }
1670 }
1671
1672 private:
1673 const FieldDescriptor* field_;
1674 };
1675
PrintField(const Message & message,const Reflection * reflection,const FieldDescriptor * field,TextGenerator & generator) const1676 void TextFormat::Printer::PrintField(const Message& message,
1677 const Reflection* reflection,
1678 const FieldDescriptor* field,
1679 TextGenerator& generator) const {
1680 if (use_short_repeated_primitives_ &&
1681 field->is_repeated() &&
1682 field->cpp_type() != FieldDescriptor::CPPTYPE_STRING &&
1683 field->cpp_type() != FieldDescriptor::CPPTYPE_MESSAGE) {
1684 PrintShortRepeatedField(message, reflection, field, generator);
1685 return;
1686 }
1687
1688 int count = 0;
1689
1690 if (field->is_repeated()) {
1691 count = reflection->FieldSize(message, field);
1692 } else if (reflection->HasField(message, field)) {
1693 count = 1;
1694 }
1695
1696 std::vector<const Message*> sorted_map_field;
1697 if (field->is_map()) {
1698 const RepeatedPtrField<Message>& map_field =
1699 reflection->GetRepeatedPtrField<Message>(message, field);
1700 for (RepeatedPtrField<Message>::const_pointer_iterator it =
1701 map_field.pointer_begin();
1702 it != map_field.pointer_end(); ++it) {
1703 sorted_map_field.push_back(*it);
1704 }
1705
1706 MapEntryMessageComparator comparator(field->message_type());
1707 std::stable_sort(sorted_map_field.begin(), sorted_map_field.end(),
1708 comparator);
1709 }
1710
1711 for (int j = 0; j < count; ++j) {
1712 const int field_index = field->is_repeated() ? j : -1;
1713
1714 PrintFieldName(message, reflection, field, generator);
1715
1716 if (field->cpp_type() == FieldDescriptor::CPPTYPE_MESSAGE) {
1717 const FieldValuePrinter* printer = FindWithDefault(
1718 custom_printers_, field, default_field_value_printer_.get());
1719 const Message& sub_message =
1720 field->is_repeated()
1721 ? (field->is_map()
1722 ? *sorted_map_field[j]
1723 : reflection->GetRepeatedMessage(message, field, j))
1724 : reflection->GetMessage(message, field);
1725 generator.Print(
1726 printer->PrintMessageStart(
1727 sub_message, field_index, count, single_line_mode_));
1728 generator.Indent();
1729 Print(sub_message, generator);
1730 generator.Outdent();
1731 generator.Print(
1732 printer->PrintMessageEnd(
1733 sub_message, field_index, count, single_line_mode_));
1734 } else {
1735 generator.Print(": ");
1736 // Write the field value.
1737 PrintFieldValue(message, reflection, field, field_index, generator);
1738 if (single_line_mode_) {
1739 generator.Print(" ");
1740 } else {
1741 generator.Print("\n");
1742 }
1743 }
1744 }
1745 }
1746
PrintShortRepeatedField(const Message & message,const Reflection * reflection,const FieldDescriptor * field,TextGenerator & generator) const1747 void TextFormat::Printer::PrintShortRepeatedField(
1748 const Message& message,
1749 const Reflection* reflection,
1750 const FieldDescriptor* field,
1751 TextGenerator& generator) const {
1752 // Print primitive repeated field in short form.
1753 PrintFieldName(message, reflection, field, generator);
1754
1755 int size = reflection->FieldSize(message, field);
1756 generator.Print(": [");
1757 for (int i = 0; i < size; i++) {
1758 if (i > 0) generator.Print(", ");
1759 PrintFieldValue(message, reflection, field, i, generator);
1760 }
1761 if (single_line_mode_) {
1762 generator.Print("] ");
1763 } else {
1764 generator.Print("]\n");
1765 }
1766 }
1767
PrintFieldName(const Message & message,const Reflection * reflection,const FieldDescriptor * field,TextGenerator & generator) const1768 void TextFormat::Printer::PrintFieldName(const Message& message,
1769 const Reflection* reflection,
1770 const FieldDescriptor* field,
1771 TextGenerator& generator) const {
1772 // if use_field_number_ is true, prints field number instead
1773 // of field name.
1774 if (use_field_number_) {
1775 generator.Print(SimpleItoa(field->number()));
1776 return;
1777 }
1778
1779 const FieldValuePrinter* printer = FindWithDefault(
1780 custom_printers_, field, default_field_value_printer_.get());
1781 generator.Print(printer->PrintFieldName(message, reflection, field));
1782 }
1783
PrintFieldValue(const Message & message,const Reflection * reflection,const FieldDescriptor * field,int index,TextGenerator & generator) const1784 void TextFormat::Printer::PrintFieldValue(
1785 const Message& message,
1786 const Reflection* reflection,
1787 const FieldDescriptor* field,
1788 int index,
1789 TextGenerator& generator) const {
1790 GOOGLE_DCHECK(field->is_repeated() || (index == -1))
1791 << "Index must be -1 for non-repeated fields";
1792
1793 const FieldValuePrinter* printer
1794 = FindWithDefault(custom_printers_, field,
1795 default_field_value_printer_.get());
1796
1797 switch (field->cpp_type()) {
1798 #define OUTPUT_FIELD(CPPTYPE, METHOD) \
1799 case FieldDescriptor::CPPTYPE_##CPPTYPE: \
1800 generator.Print(printer->Print##METHOD(field->is_repeated() \
1801 ? reflection->GetRepeated##METHOD(message, field, index) \
1802 : reflection->Get##METHOD(message, field))); \
1803 break
1804
1805 OUTPUT_FIELD( INT32, Int32);
1806 OUTPUT_FIELD( INT64, Int64);
1807 OUTPUT_FIELD(UINT32, UInt32);
1808 OUTPUT_FIELD(UINT64, UInt64);
1809 OUTPUT_FIELD( FLOAT, Float);
1810 OUTPUT_FIELD(DOUBLE, Double);
1811 OUTPUT_FIELD( BOOL, Bool);
1812 #undef OUTPUT_FIELD
1813
1814 case FieldDescriptor::CPPTYPE_STRING: {
1815 string scratch;
1816 const string& value = field->is_repeated()
1817 ? reflection->GetRepeatedStringReference(
1818 message, field, index, &scratch)
1819 : reflection->GetStringReference(message, field, &scratch);
1820 const string* value_to_print = &value;
1821 string truncated_value;
1822 if (truncate_string_field_longer_than_ > 0 &&
1823 truncate_string_field_longer_than_ < value.size()) {
1824 truncated_value = value.substr(0, truncate_string_field_longer_than_) +
1825 "...<truncated>...";
1826 value_to_print = &truncated_value;
1827 }
1828 if (field->type() == FieldDescriptor::TYPE_STRING) {
1829 generator.Print(printer->PrintString(*value_to_print));
1830 } else {
1831 GOOGLE_DCHECK_EQ(field->type(), FieldDescriptor::TYPE_BYTES);
1832 generator.Print(printer->PrintBytes(*value_to_print));
1833 }
1834 break;
1835 }
1836
1837 case FieldDescriptor::CPPTYPE_ENUM: {
1838 int enum_value = field->is_repeated()
1839 ? reflection->GetRepeatedEnumValue(message, field, index)
1840 : reflection->GetEnumValue(message, field);
1841 const EnumValueDescriptor* enum_desc =
1842 field->enum_type()->FindValueByNumber(enum_value);
1843 if (enum_desc != NULL) {
1844 generator.Print(printer->PrintEnum(enum_value, enum_desc->name()));
1845 } else {
1846 // Ordinarily, enum_desc should not be null, because proto2 has the
1847 // invariant that set enum field values must be in-range, but with the
1848 // new integer-based API for enums (or the RepeatedField<int> loophole),
1849 // it is possible for the user to force an unknown integer value. So we
1850 // simply use the integer value itself as the enum value name in this
1851 // case.
1852 generator.Print(printer->PrintEnum(enum_value,
1853 StringPrintf("%d", enum_value)));
1854 }
1855 break;
1856 }
1857
1858 case FieldDescriptor::CPPTYPE_MESSAGE:
1859 Print(field->is_repeated()
1860 ? reflection->GetRepeatedMessage(message, field, index)
1861 : reflection->GetMessage(message, field),
1862 generator);
1863 break;
1864 }
1865 }
1866
Print(const Message & message,io::ZeroCopyOutputStream * output)1867 /* static */ bool TextFormat::Print(const Message& message,
1868 io::ZeroCopyOutputStream* output) {
1869 return Printer().Print(message, output);
1870 }
1871
PrintUnknownFields(const UnknownFieldSet & unknown_fields,io::ZeroCopyOutputStream * output)1872 /* static */ bool TextFormat::PrintUnknownFields(
1873 const UnknownFieldSet& unknown_fields,
1874 io::ZeroCopyOutputStream* output) {
1875 return Printer().PrintUnknownFields(unknown_fields, output);
1876 }
1877
PrintToString(const Message & message,string * output)1878 /* static */ bool TextFormat::PrintToString(
1879 const Message& message, string* output) {
1880 return Printer().PrintToString(message, output);
1881 }
1882
PrintUnknownFieldsToString(const UnknownFieldSet & unknown_fields,string * output)1883 /* static */ bool TextFormat::PrintUnknownFieldsToString(
1884 const UnknownFieldSet& unknown_fields, string* output) {
1885 return Printer().PrintUnknownFieldsToString(unknown_fields, output);
1886 }
1887
PrintFieldValueToString(const Message & message,const FieldDescriptor * field,int index,string * output)1888 /* static */ void TextFormat::PrintFieldValueToString(
1889 const Message& message,
1890 const FieldDescriptor* field,
1891 int index,
1892 string* output) {
1893 return Printer().PrintFieldValueToString(message, field, index, output);
1894 }
1895
ParseFieldValueFromString(const string & input,const FieldDescriptor * field,Message * message)1896 /* static */ bool TextFormat::ParseFieldValueFromString(
1897 const string& input,
1898 const FieldDescriptor* field,
1899 Message* message) {
1900 return Parser().ParseFieldValueFromString(input, field, message);
1901 }
1902
1903 // Prints an integer as hex with a fixed number of digits dependent on the
1904 // integer type.
1905 template<typename IntType>
PaddedHex(IntType value)1906 static string PaddedHex(IntType value) {
1907 string result;
1908 result.reserve(sizeof(value) * 2);
1909 for (int i = sizeof(value) * 2 - 1; i >= 0; i--) {
1910 result.push_back(int_to_hex_digit(value >> (i*4) & 0x0F));
1911 }
1912 return result;
1913 }
1914
PrintUnknownFields(const UnknownFieldSet & unknown_fields,TextGenerator & generator) const1915 void TextFormat::Printer::PrintUnknownFields(
1916 const UnknownFieldSet& unknown_fields, TextGenerator& generator) const {
1917 for (int i = 0; i < unknown_fields.field_count(); i++) {
1918 const UnknownField& field = unknown_fields.field(i);
1919 string field_number = SimpleItoa(field.number());
1920
1921 switch (field.type()) {
1922 case UnknownField::TYPE_VARINT:
1923 generator.Print(field_number);
1924 generator.Print(": ");
1925 generator.Print(SimpleItoa(field.varint()));
1926 if (single_line_mode_) {
1927 generator.Print(" ");
1928 } else {
1929 generator.Print("\n");
1930 }
1931 break;
1932 case UnknownField::TYPE_FIXED32: {
1933 generator.Print(field_number);
1934 generator.Print(": 0x");
1935 generator.Print(
1936 StrCat(strings::Hex(field.fixed32(), strings::ZERO_PAD_8)));
1937 if (single_line_mode_) {
1938 generator.Print(" ");
1939 } else {
1940 generator.Print("\n");
1941 }
1942 break;
1943 }
1944 case UnknownField::TYPE_FIXED64: {
1945 generator.Print(field_number);
1946 generator.Print(": 0x");
1947 generator.Print(
1948 StrCat(strings::Hex(field.fixed64(), strings::ZERO_PAD_16)));
1949 if (single_line_mode_) {
1950 generator.Print(" ");
1951 } else {
1952 generator.Print("\n");
1953 }
1954 break;
1955 }
1956 case UnknownField::TYPE_LENGTH_DELIMITED: {
1957 generator.Print(field_number);
1958 const string& value = field.length_delimited();
1959 UnknownFieldSet embedded_unknown_fields;
1960 if (!value.empty() && embedded_unknown_fields.ParseFromString(value)) {
1961 // This field is parseable as a Message.
1962 // So it is probably an embedded message.
1963 if (single_line_mode_) {
1964 generator.Print(" { ");
1965 } else {
1966 generator.Print(" {\n");
1967 generator.Indent();
1968 }
1969 PrintUnknownFields(embedded_unknown_fields, generator);
1970 if (single_line_mode_) {
1971 generator.Print("} ");
1972 } else {
1973 generator.Outdent();
1974 generator.Print("}\n");
1975 }
1976 } else {
1977 // This field is not parseable as a Message.
1978 // So it is probably just a plain string.
1979 string printed(": \"");
1980 CEscapeAndAppend(value, &printed);
1981 printed.append(single_line_mode_ ? "\" " : "\"\n");
1982 generator.Print(printed);
1983 }
1984 break;
1985 }
1986 case UnknownField::TYPE_GROUP:
1987 generator.Print(field_number);
1988 if (single_line_mode_) {
1989 generator.Print(" { ");
1990 } else {
1991 generator.Print(" {\n");
1992 generator.Indent();
1993 }
1994 PrintUnknownFields(field.group(), generator);
1995 if (single_line_mode_) {
1996 generator.Print("} ");
1997 } else {
1998 generator.Outdent();
1999 generator.Print("}\n");
2000 }
2001 break;
2002 }
2003 }
2004 }
2005
2006 } // namespace protobuf
2007 } // namespace google
2008