1 // Protocol Buffers - Google's data interchange format
2 // Copyright 2008 Google Inc.  All rights reserved.
3 // https://developers.google.com/protocol-buffers/
4 //
5 // Redistribution and use in source and binary forms, with or without
6 // modification, are permitted provided that the following conditions are
7 // met:
8 //
9 //     * Redistributions of source code must retain the above copyright
10 // notice, this list of conditions and the following disclaimer.
11 //     * Redistributions in binary form must reproduce the above
12 // copyright notice, this list of conditions and the following disclaimer
13 // in the documentation and/or other materials provided with the
14 // distribution.
15 //     * Neither the name of Google Inc. nor the names of its
16 // contributors may be used to endorse or promote products derived from
17 // this software without specific prior written permission.
18 //
19 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
20 // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
21 // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
22 // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
23 // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
24 // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
25 // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
26 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
27 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
28 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
29 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30 
31 // Author: kenton@google.com (Kenton Varda)
32 //  Based on original Protocol Buffers design by
33 //  Sanjay Ghemawat, Jeff Dean, and others.
34 
35 #include <google/protobuf/stubs/hash.h>
36 #include <map>
37 #include <set>
38 #include <string>
39 #include <vector>
40 #include <algorithm>
41 #include <limits>
42 
43 #include <google/protobuf/descriptor.h>
44 #include <google/protobuf/descriptor_database.h>
45 #include <google/protobuf/descriptor.pb.h>
46 #include <google/protobuf/dynamic_message.h>
47 #include <google/protobuf/generated_message_util.h>
48 #include <google/protobuf/text_format.h>
49 #include <google/protobuf/unknown_field_set.h>
50 #include <google/protobuf/wire_format.h>
51 #include <google/protobuf/io/strtod.h>
52 #include <google/protobuf/io/coded_stream.h>
53 #include <google/protobuf/io/tokenizer.h>
54 #include <google/protobuf/io/zero_copy_stream_impl.h>
55 #include <google/protobuf/stubs/common.h>
56 #include <google/protobuf/stubs/once.h>
57 #include <google/protobuf/stubs/strutil.h>
58 #include <google/protobuf/stubs/substitute.h>
59 #include <google/protobuf/stubs/map_util.h>
60 #include <google/protobuf/stubs/stl_util.h>
61 
62 #undef PACKAGE  // autoheader #defines this.  :(
63 
64 namespace google {
65 namespace protobuf {
66 
67 const FieldDescriptor::CppType
68 FieldDescriptor::kTypeToCppTypeMap[MAX_TYPE + 1] = {
69   static_cast<CppType>(0),  // 0 is reserved for errors
70 
71   CPPTYPE_DOUBLE,   // TYPE_DOUBLE
72   CPPTYPE_FLOAT,    // TYPE_FLOAT
73   CPPTYPE_INT64,    // TYPE_INT64
74   CPPTYPE_UINT64,   // TYPE_UINT64
75   CPPTYPE_INT32,    // TYPE_INT32
76   CPPTYPE_UINT64,   // TYPE_FIXED64
77   CPPTYPE_UINT32,   // TYPE_FIXED32
78   CPPTYPE_BOOL,     // TYPE_BOOL
79   CPPTYPE_STRING,   // TYPE_STRING
80   CPPTYPE_MESSAGE,  // TYPE_GROUP
81   CPPTYPE_MESSAGE,  // TYPE_MESSAGE
82   CPPTYPE_STRING,   // TYPE_BYTES
83   CPPTYPE_UINT32,   // TYPE_UINT32
84   CPPTYPE_ENUM,     // TYPE_ENUM
85   CPPTYPE_INT32,    // TYPE_SFIXED32
86   CPPTYPE_INT64,    // TYPE_SFIXED64
87   CPPTYPE_INT32,    // TYPE_SINT32
88   CPPTYPE_INT64,    // TYPE_SINT64
89 };
90 
91 const char * const FieldDescriptor::kTypeToName[MAX_TYPE + 1] = {
92   "ERROR",     // 0 is reserved for errors
93 
94   "double",    // TYPE_DOUBLE
95   "float",     // TYPE_FLOAT
96   "int64",     // TYPE_INT64
97   "uint64",    // TYPE_UINT64
98   "int32",     // TYPE_INT32
99   "fixed64",   // TYPE_FIXED64
100   "fixed32",   // TYPE_FIXED32
101   "bool",      // TYPE_BOOL
102   "string",    // TYPE_STRING
103   "group",     // TYPE_GROUP
104   "message",   // TYPE_MESSAGE
105   "bytes",     // TYPE_BYTES
106   "uint32",    // TYPE_UINT32
107   "enum",      // TYPE_ENUM
108   "sfixed32",  // TYPE_SFIXED32
109   "sfixed64",  // TYPE_SFIXED64
110   "sint32",    // TYPE_SINT32
111   "sint64",    // TYPE_SINT64
112 };
113 
114 const char * const FieldDescriptor::kCppTypeToName[MAX_CPPTYPE + 1] = {
115   "ERROR",     // 0 is reserved for errors
116 
117   "int32",     // CPPTYPE_INT32
118   "int64",     // CPPTYPE_INT64
119   "uint32",    // CPPTYPE_UINT32
120   "uint64",    // CPPTYPE_UINT64
121   "double",    // CPPTYPE_DOUBLE
122   "float",     // CPPTYPE_FLOAT
123   "bool",      // CPPTYPE_BOOL
124   "enum",      // CPPTYPE_ENUM
125   "string",    // CPPTYPE_STRING
126   "message",   // CPPTYPE_MESSAGE
127 };
128 
129 const char * const FieldDescriptor::kLabelToName[MAX_LABEL + 1] = {
130   "ERROR",     // 0 is reserved for errors
131 
132   "optional",  // LABEL_OPTIONAL
133   "required",  // LABEL_REQUIRED
134   "repeated",  // LABEL_REPEATED
135 };
136 
137 static const char * const kNonLinkedWeakMessageReplacementName = "google.protobuf.Empty";
138 
139 #ifndef _MSC_VER  // MSVC doesn't need these and won't even accept them.
140 const int FieldDescriptor::kMaxNumber;
141 const int FieldDescriptor::kFirstReservedNumber;
142 const int FieldDescriptor::kLastReservedNumber;
143 #endif
144 
145 namespace {
146 
ToCamelCase(const string & input)147 string ToCamelCase(const string& input) {
148   bool capitalize_next = false;
149   string result;
150   result.reserve(input.size());
151 
152   for (int i = 0; i < input.size(); i++) {
153     if (input[i] == '_') {
154       capitalize_next = true;
155     } else if (capitalize_next) {
156       // Note:  I distrust ctype.h due to locales.
157       if ('a' <= input[i] && input[i] <= 'z') {
158         result.push_back(input[i] - 'a' + 'A');
159       } else {
160         result.push_back(input[i]);
161       }
162       capitalize_next = false;
163     } else {
164       result.push_back(input[i]);
165     }
166   }
167 
168   // Lower-case the first letter.
169   if (!result.empty() && 'A' <= result[0] && result[0] <= 'Z') {
170     result[0] = result[0] - 'A' + 'a';
171   }
172 
173   return result;
174 }
175 
176 // A DescriptorPool contains a bunch of hash_maps to implement the
177 // various Find*By*() methods.  Since hashtable lookups are O(1), it's
178 // most efficient to construct a fixed set of large hash_maps used by
179 // all objects in the pool rather than construct one or more small
180 // hash_maps for each object.
181 //
182 // The keys to these hash_maps are (parent, name) or (parent, number)
183 // pairs.  Unfortunately STL doesn't provide hash functions for pair<>,
184 // so we must invent our own.
185 //
186 // TODO(kenton):  Use StringPiece rather than const char* in keys?  It would
187 //   be a lot cleaner but we'd just have to convert it back to const char*
188 //   for the open source release.
189 
190 typedef pair<const void*, const char*> PointerStringPair;
191 
192 struct PointerStringPairEqual {
operator ()google::protobuf::__anond0d5fb670111::PointerStringPairEqual193   inline bool operator()(const PointerStringPair& a,
194                          const PointerStringPair& b) const {
195     return a.first == b.first && strcmp(a.second, b.second) == 0;
196   }
197 };
198 
199 template<typename PairType>
200 struct PointerIntegerPairHash {
operator ()google::protobuf::__anond0d5fb670111::PointerIntegerPairHash201   size_t operator()(const PairType& p) const {
202     // FIXME(kenton):  What is the best way to compute this hash?  I have
203     // no idea!  This seems a bit better than an XOR.
204     return reinterpret_cast<intptr_t>(p.first) * ((1 << 16) - 1) + p.second;
205   }
206 
207 #ifdef _MSC_VER
208   // Used only by MSVC and platforms where hash_map is not available.
209   static const size_t bucket_size = 4;
210   static const size_t min_buckets = 8;
211 #endif
operator ()google::protobuf::__anond0d5fb670111::PointerIntegerPairHash212   inline bool operator()(const PairType& a, const PairType& b) const {
213     return a.first < b.first ||
214           (a.first == b.first && a.second < b.second);
215   }
216 };
217 
218 typedef pair<const Descriptor*, int> DescriptorIntPair;
219 typedef pair<const EnumDescriptor*, int> EnumIntPair;
220 
221 struct PointerStringPairHash {
operator ()google::protobuf::__anond0d5fb670111::PointerStringPairHash222   size_t operator()(const PointerStringPair& p) const {
223     // FIXME(kenton):  What is the best way to compute this hash?  I have
224     // no idea!  This seems a bit better than an XOR.
225     hash<const char*> cstring_hash;
226     return reinterpret_cast<intptr_t>(p.first) * ((1 << 16) - 1) +
227            cstring_hash(p.second);
228   }
229 
230 #ifdef _MSC_VER
231   // Used only by MSVC and platforms where hash_map is not available.
232   static const size_t bucket_size = 4;
233   static const size_t min_buckets = 8;
234 #endif
operator ()google::protobuf::__anond0d5fb670111::PointerStringPairHash235   inline bool operator()(const PointerStringPair& a,
236                          const PointerStringPair& b) const {
237     if (a.first < b.first) return true;
238     if (a.first > b.first) return false;
239     return strcmp(a.second, b.second) < 0;
240   }
241 };
242 
243 
244 struct Symbol {
245   enum Type {
246     NULL_SYMBOL, MESSAGE, FIELD, ONEOF, ENUM, ENUM_VALUE, SERVICE, METHOD,
247     PACKAGE
248   };
249   Type type;
250   union {
251     const Descriptor* descriptor;
252     const FieldDescriptor* field_descriptor;
253     const OneofDescriptor* oneof_descriptor;
254     const EnumDescriptor* enum_descriptor;
255     const EnumValueDescriptor* enum_value_descriptor;
256     const ServiceDescriptor* service_descriptor;
257     const MethodDescriptor* method_descriptor;
258     const FileDescriptor* package_file_descriptor;
259   };
260 
Symbolgoogle::protobuf::__anond0d5fb670111::Symbol261   inline Symbol() : type(NULL_SYMBOL) { descriptor = NULL; }
IsNullgoogle::protobuf::__anond0d5fb670111::Symbol262   inline bool IsNull() const { return type == NULL_SYMBOL; }
IsTypegoogle::protobuf::__anond0d5fb670111::Symbol263   inline bool IsType() const {
264     return type == MESSAGE || type == ENUM;
265   }
IsAggregategoogle::protobuf::__anond0d5fb670111::Symbol266   inline bool IsAggregate() const {
267     return type == MESSAGE || type == PACKAGE
268         || type == ENUM || type == SERVICE;
269   }
270 
271 #define CONSTRUCTOR(TYPE, TYPE_CONSTANT, FIELD)  \
272   inline explicit Symbol(const TYPE* value) {    \
273     type = TYPE_CONSTANT;                        \
274     this->FIELD = value;                         \
275   }
276 
CONSTRUCTORgoogle::protobuf::__anond0d5fb670111::Symbol277   CONSTRUCTOR(Descriptor         , MESSAGE   , descriptor             )
278   CONSTRUCTOR(FieldDescriptor    , FIELD     , field_descriptor       )
279   CONSTRUCTOR(OneofDescriptor    , ONEOF     , oneof_descriptor       )
280   CONSTRUCTOR(EnumDescriptor     , ENUM      , enum_descriptor        )
281   CONSTRUCTOR(EnumValueDescriptor, ENUM_VALUE, enum_value_descriptor  )
282   CONSTRUCTOR(ServiceDescriptor  , SERVICE   , service_descriptor     )
283   CONSTRUCTOR(MethodDescriptor   , METHOD    , method_descriptor      )
284   CONSTRUCTOR(FileDescriptor     , PACKAGE   , package_file_descriptor)
285 #undef CONSTRUCTOR
286 
287   const FileDescriptor* GetFile() const {
288     switch (type) {
289       case NULL_SYMBOL: return NULL;
290       case MESSAGE    : return descriptor           ->file();
291       case FIELD      : return field_descriptor     ->file();
292       case ONEOF      : return oneof_descriptor     ->containing_type()->file();
293       case ENUM       : return enum_descriptor      ->file();
294       case ENUM_VALUE : return enum_value_descriptor->type()->file();
295       case SERVICE    : return service_descriptor   ->file();
296       case METHOD     : return method_descriptor    ->service()->file();
297       case PACKAGE    : return package_file_descriptor;
298     }
299     return NULL;
300   }
301 };
302 
303 const Symbol kNullSymbol;
304 
305 typedef hash_map<const char*, Symbol,
306                  hash<const char*>, streq>
307   SymbolsByNameMap;
308 typedef hash_map<PointerStringPair, Symbol,
309                  PointerStringPairHash, PointerStringPairEqual>
310   SymbolsByParentMap;
311 typedef hash_map<const char*, const FileDescriptor*,
312                  hash<const char*>, streq>
313   FilesByNameMap;
314 typedef hash_map<PointerStringPair, const FieldDescriptor*,
315                  PointerStringPairHash, PointerStringPairEqual>
316   FieldsByNameMap;
317 typedef hash_map<DescriptorIntPair, const FieldDescriptor*,
318                  PointerIntegerPairHash<DescriptorIntPair> >
319   FieldsByNumberMap;
320 typedef hash_map<EnumIntPair, const EnumValueDescriptor*,
321                  PointerIntegerPairHash<EnumIntPair> >
322   EnumValuesByNumberMap;
323 // This is a map rather than a hash_map, since we use it to iterate
324 // through all the extensions that extend a given Descriptor, and an
325 // ordered data structure that implements lower_bound is convenient
326 // for that.
327 typedef map<DescriptorIntPair, const FieldDescriptor*>
328   ExtensionsGroupedByDescriptorMap;
329 typedef hash_map<string, const SourceCodeInfo_Location*> LocationsByPathMap;
330 }  // anonymous namespace
331 
332 // ===================================================================
333 // DescriptorPool::Tables
334 
335 class DescriptorPool::Tables {
336  public:
337   Tables();
338   ~Tables();
339 
340   // Record the current state of the tables to the stack of checkpoints.
341   // Each call to AddCheckpoint() must be paired with exactly one call to either
342   // ClearLastCheckpoint() or RollbackToLastCheckpoint().
343   //
344   // This is used when building files, since some kinds of validation errors
345   // cannot be detected until the file's descriptors have already been added to
346   // the tables.
347   //
348   // This supports recursive checkpoints, since building a file may trigger
349   // recursive building of other files. Note that recursive checkpoints are not
350   // normally necessary; explicit dependencies are built prior to checkpointing.
351   // So although we recursively build transitive imports, there is at most one
352   // checkpoint in the stack during dependency building.
353   //
354   // Recursive checkpoints only arise during cross-linking of the descriptors.
355   // Symbol references must be resolved, via DescriptorBuilder::FindSymbol and
356   // friends. If the pending file references an unknown symbol
357   // (e.g., it is not defined in the pending file's explicit dependencies), and
358   // the pool is using a fallback database, and that database contains a file
359   // defining that symbol, and that file has not yet been built by the pool,
360   // the pool builds the file during cross-linking, leading to another
361   // checkpoint.
362   void AddCheckpoint();
363 
364   // Mark the last checkpoint as having cleared successfully, removing it from
365   // the stack. If the stack is empty, all pending symbols will be committed.
366   //
367   // Note that this does not guarantee that the symbols added since the last
368   // checkpoint won't be rolled back: if a checkpoint gets rolled back,
369   // everything past that point gets rolled back, including symbols added after
370   // checkpoints that were pushed onto the stack after it and marked as cleared.
371   void ClearLastCheckpoint();
372 
373   // Roll back the Tables to the state of the checkpoint at the top of the
374   // stack, removing everything that was added after that point.
375   void RollbackToLastCheckpoint();
376 
377   // The stack of files which are currently being built.  Used to detect
378   // cyclic dependencies when loading files from a DescriptorDatabase.  Not
379   // used when fallback_database_ == NULL.
380   vector<string> pending_files_;
381 
382   // A set of files which we have tried to load from the fallback database
383   // and encountered errors.  We will not attempt to load them again during
384   // execution of the current public API call, but for compatibility with
385   // legacy clients, this is cleared at the beginning of each public API call.
386   // Not used when fallback_database_ == NULL.
387   hash_set<string> known_bad_files_;
388 
389   // A set of symbols which we have tried to load from the fallback database
390   // and encountered errors. We will not attempt to load them again during
391   // execution of the current public API call, but for compatibility with
392   // legacy clients, this is cleared at the beginning of each public API call.
393   hash_set<string> known_bad_symbols_;
394 
395   // The set of descriptors for which we've already loaded the full
396   // set of extensions numbers from fallback_database_.
397   hash_set<const Descriptor*> extensions_loaded_from_db_;
398 
399   // -----------------------------------------------------------------
400   // Finding items.
401 
402   // Find symbols.  This returns a null Symbol (symbol.IsNull() is true)
403   // if not found.
404   inline Symbol FindSymbol(const string& key) const;
405 
406   // This implements the body of DescriptorPool::Find*ByName().  It should
407   // really be a private method of DescriptorPool, but that would require
408   // declaring Symbol in descriptor.h, which would drag all kinds of other
409   // stuff into the header.  Yay C++.
410   Symbol FindByNameHelper(
411     const DescriptorPool* pool, const string& name);
412 
413   // These return NULL if not found.
414   inline const FileDescriptor* FindFile(const string& key) const;
415   inline const FieldDescriptor* FindExtension(const Descriptor* extendee,
416                                               int number);
417   inline void FindAllExtensions(const Descriptor* extendee,
418                                 vector<const FieldDescriptor*>* out) const;
419 
420   // -----------------------------------------------------------------
421   // Adding items.
422 
423   // These add items to the corresponding tables.  They return false if
424   // the key already exists in the table.  For AddSymbol(), the string passed
425   // in must be one that was constructed using AllocateString(), as it will
426   // be used as a key in the symbols_by_name_ map without copying.
427   bool AddSymbol(const string& full_name, Symbol symbol);
428   bool AddFile(const FileDescriptor* file);
429   bool AddExtension(const FieldDescriptor* field);
430 
431   // -----------------------------------------------------------------
432   // Allocating memory.
433 
434   // Allocate an object which will be reclaimed when the pool is
435   // destroyed.  Note that the object's destructor will never be called,
436   // so its fields must be plain old data (primitive data types and
437   // pointers).  All of the descriptor types are such objects.
438   template<typename Type> Type* Allocate();
439 
440   // Allocate an array of objects which will be reclaimed when the
441   // pool in destroyed.  Again, destructors are never called.
442   template<typename Type> Type* AllocateArray(int count);
443 
444   // Allocate a string which will be destroyed when the pool is destroyed.
445   // The string is initialized to the given value for convenience.
446   string* AllocateString(const string& value);
447 
448   // Allocate a protocol message object.  Some older versions of GCC have
449   // trouble understanding explicit template instantiations in some cases, so
450   // in those cases we have to pass a dummy pointer of the right type as the
451   // parameter instead of specifying the type explicitly.
452   template<typename Type> Type* AllocateMessage(Type* dummy = NULL);
453 
454   // Allocate a FileDescriptorTables object.
455   FileDescriptorTables* AllocateFileTables();
456 
457  private:
458   vector<string*> strings_;    // All strings in the pool.
459   vector<Message*> messages_;  // All messages in the pool.
460   vector<FileDescriptorTables*> file_tables_;  // All file tables in the pool.
461   vector<void*> allocations_;  // All other memory allocated in the pool.
462 
463   SymbolsByNameMap      symbols_by_name_;
464   FilesByNameMap        files_by_name_;
465   ExtensionsGroupedByDescriptorMap extensions_;
466 
467   struct CheckPoint {
CheckPointgoogle::protobuf::DescriptorPool::Tables::CheckPoint468     explicit CheckPoint(const Tables* tables)
469       : strings_before_checkpoint(tables->strings_.size()),
470         messages_before_checkpoint(tables->messages_.size()),
471         file_tables_before_checkpoint(tables->file_tables_.size()),
472         allocations_before_checkpoint(tables->allocations_.size()),
473         pending_symbols_before_checkpoint(
474             tables->symbols_after_checkpoint_.size()),
475         pending_files_before_checkpoint(
476             tables->files_after_checkpoint_.size()),
477         pending_extensions_before_checkpoint(
478             tables->extensions_after_checkpoint_.size()) {
479     }
480     int strings_before_checkpoint;
481     int messages_before_checkpoint;
482     int file_tables_before_checkpoint;
483     int allocations_before_checkpoint;
484     int pending_symbols_before_checkpoint;
485     int pending_files_before_checkpoint;
486     int pending_extensions_before_checkpoint;
487   };
488   vector<CheckPoint> checkpoints_;
489   vector<const char*      > symbols_after_checkpoint_;
490   vector<const char*      > files_after_checkpoint_;
491   vector<DescriptorIntPair> extensions_after_checkpoint_;
492 
493   // Allocate some bytes which will be reclaimed when the pool is
494   // destroyed.
495   void* AllocateBytes(int size);
496 };
497 
498 // Contains tables specific to a particular file.  These tables are not
499 // modified once the file has been constructed, so they need not be
500 // protected by a mutex.  This makes operations that depend only on the
501 // contents of a single file -- e.g. Descriptor::FindFieldByName() --
502 // lock-free.
503 //
504 // For historical reasons, the definitions of the methods of
505 // FileDescriptorTables and DescriptorPool::Tables are interleaved below.
506 // These used to be a single class.
507 class FileDescriptorTables {
508  public:
509   FileDescriptorTables();
510   ~FileDescriptorTables();
511 
512   // Empty table, used with placeholder files.
513   static const FileDescriptorTables kEmpty;
514 
515   // -----------------------------------------------------------------
516   // Finding items.
517 
518   // Find symbols.  These return a null Symbol (symbol.IsNull() is true)
519   // if not found.
520   inline Symbol FindNestedSymbol(const void* parent,
521                                  const string& name) const;
522   inline Symbol FindNestedSymbolOfType(const void* parent,
523                                        const string& name,
524                                        const Symbol::Type type) const;
525 
526   // These return NULL if not found.
527   inline const FieldDescriptor* FindFieldByNumber(
528     const Descriptor* parent, int number) const;
529   inline const FieldDescriptor* FindFieldByLowercaseName(
530     const void* parent, const string& lowercase_name) const;
531   inline const FieldDescriptor* FindFieldByCamelcaseName(
532     const void* parent, const string& camelcase_name) const;
533   inline const EnumValueDescriptor* FindEnumValueByNumber(
534     const EnumDescriptor* parent, int number) const;
535 
536   // -----------------------------------------------------------------
537   // Adding items.
538 
539   // These add items to the corresponding tables.  They return false if
540   // the key already exists in the table.  For AddAliasUnderParent(), the
541   // string passed in must be one that was constructed using AllocateString(),
542   // as it will be used as a key in the symbols_by_parent_ map without copying.
543   bool AddAliasUnderParent(const void* parent, const string& name,
544                            Symbol symbol);
545   bool AddFieldByNumber(const FieldDescriptor* field);
546   bool AddEnumValueByNumber(const EnumValueDescriptor* value);
547 
548   // Adds the field to the lowercase_name and camelcase_name maps.  Never
549   // fails because we allow duplicates; the first field by the name wins.
550   void AddFieldByStylizedNames(const FieldDescriptor* field);
551 
552   // Populates p->first->locations_by_path_ from p->second.
553   // Unusual signature dictated by GoogleOnceDynamic.
554   static void BuildLocationsByPath(
555       pair<const FileDescriptorTables*, const SourceCodeInfo*>* p);
556 
557   // Returns the location denoted by the specified path through info,
558   // or NULL if not found.
559   // The value of info must be that of the corresponding FileDescriptor.
560   // (Conceptually a pure function, but stateful as an optimisation.)
561   const SourceCodeInfo_Location* GetSourceLocation(
562       const vector<int>& path, const SourceCodeInfo* info) const;
563 
564  private:
565   SymbolsByParentMap    symbols_by_parent_;
566   FieldsByNameMap       fields_by_lowercase_name_;
567   FieldsByNameMap       fields_by_camelcase_name_;
568   FieldsByNumberMap     fields_by_number_;       // Not including extensions.
569   EnumValuesByNumberMap enum_values_by_number_;
570 
571   // Populated on first request to save space, hence constness games.
572   mutable GoogleOnceDynamic locations_by_path_once_;
573   mutable LocationsByPathMap locations_by_path_;
574 };
575 
Tables()576 DescriptorPool::Tables::Tables()
577     // Start some hash_map and hash_set objects with a small # of buckets
578     : known_bad_files_(3),
579       known_bad_symbols_(3),
580       extensions_loaded_from_db_(3),
581       symbols_by_name_(3),
582       files_by_name_(3) {}
583 
584 
~Tables()585 DescriptorPool::Tables::~Tables() {
586   GOOGLE_DCHECK(checkpoints_.empty());
587   // Note that the deletion order is important, since the destructors of some
588   // messages may refer to objects in allocations_.
589   STLDeleteElements(&messages_);
590   for (int i = 0; i < allocations_.size(); i++) {
591     operator delete(allocations_[i]);
592   }
593   STLDeleteElements(&strings_);
594   STLDeleteElements(&file_tables_);
595 }
596 
FileDescriptorTables()597 FileDescriptorTables::FileDescriptorTables()
598     // Initialize all the hash tables to start out with a small # of buckets
599     : symbols_by_parent_(3),
600       fields_by_lowercase_name_(3),
601       fields_by_camelcase_name_(3),
602       fields_by_number_(3),
603       enum_values_by_number_(3) {
604 }
605 
~FileDescriptorTables()606 FileDescriptorTables::~FileDescriptorTables() {}
607 
608 const FileDescriptorTables FileDescriptorTables::kEmpty;
609 
AddCheckpoint()610 void DescriptorPool::Tables::AddCheckpoint() {
611   checkpoints_.push_back(CheckPoint(this));
612 }
613 
ClearLastCheckpoint()614 void DescriptorPool::Tables::ClearLastCheckpoint() {
615   GOOGLE_DCHECK(!checkpoints_.empty());
616   checkpoints_.pop_back();
617   if (checkpoints_.empty()) {
618     // All checkpoints have been cleared: we can now commit all of the pending
619     // data.
620     symbols_after_checkpoint_.clear();
621     files_after_checkpoint_.clear();
622     extensions_after_checkpoint_.clear();
623   }
624 }
625 
RollbackToLastCheckpoint()626 void DescriptorPool::Tables::RollbackToLastCheckpoint() {
627   GOOGLE_DCHECK(!checkpoints_.empty());
628   const CheckPoint& checkpoint = checkpoints_.back();
629 
630   for (int i = checkpoint.pending_symbols_before_checkpoint;
631        i < symbols_after_checkpoint_.size();
632        i++) {
633     symbols_by_name_.erase(symbols_after_checkpoint_[i]);
634   }
635   for (int i = checkpoint.pending_files_before_checkpoint;
636        i < files_after_checkpoint_.size();
637        i++) {
638     files_by_name_.erase(files_after_checkpoint_[i]);
639   }
640   for (int i = checkpoint.pending_extensions_before_checkpoint;
641        i < extensions_after_checkpoint_.size();
642        i++) {
643     extensions_.erase(extensions_after_checkpoint_[i]);
644   }
645 
646   symbols_after_checkpoint_.resize(
647       checkpoint.pending_symbols_before_checkpoint);
648   files_after_checkpoint_.resize(checkpoint.pending_files_before_checkpoint);
649   extensions_after_checkpoint_.resize(
650       checkpoint.pending_extensions_before_checkpoint);
651 
652   STLDeleteContainerPointers(
653       strings_.begin() + checkpoint.strings_before_checkpoint, strings_.end());
654   STLDeleteContainerPointers(
655       messages_.begin() + checkpoint.messages_before_checkpoint,
656       messages_.end());
657   STLDeleteContainerPointers(
658       file_tables_.begin() + checkpoint.file_tables_before_checkpoint,
659       file_tables_.end());
660   for (int i = checkpoint.allocations_before_checkpoint;
661        i < allocations_.size();
662        i++) {
663     operator delete(allocations_[i]);
664   }
665 
666   strings_.resize(checkpoint.strings_before_checkpoint);
667   messages_.resize(checkpoint.messages_before_checkpoint);
668   file_tables_.resize(checkpoint.file_tables_before_checkpoint);
669   allocations_.resize(checkpoint.allocations_before_checkpoint);
670   checkpoints_.pop_back();
671 }
672 
673 // -------------------------------------------------------------------
674 
FindSymbol(const string & key) const675 inline Symbol DescriptorPool::Tables::FindSymbol(const string& key) const {
676   const Symbol* result = FindOrNull(symbols_by_name_, key.c_str());
677   if (result == NULL) {
678     return kNullSymbol;
679   } else {
680     return *result;
681   }
682 }
683 
FindNestedSymbol(const void * parent,const string & name) const684 inline Symbol FileDescriptorTables::FindNestedSymbol(
685     const void* parent, const string& name) const {
686   const Symbol* result =
687     FindOrNull(symbols_by_parent_, PointerStringPair(parent, name.c_str()));
688   if (result == NULL) {
689     return kNullSymbol;
690   } else {
691     return *result;
692   }
693 }
694 
FindNestedSymbolOfType(const void * parent,const string & name,const Symbol::Type type) const695 inline Symbol FileDescriptorTables::FindNestedSymbolOfType(
696     const void* parent, const string& name, const Symbol::Type type) const {
697   Symbol result = FindNestedSymbol(parent, name);
698   if (result.type != type) return kNullSymbol;
699   return result;
700 }
701 
FindByNameHelper(const DescriptorPool * pool,const string & name)702 Symbol DescriptorPool::Tables::FindByNameHelper(
703     const DescriptorPool* pool, const string& name) {
704   MutexLockMaybe lock(pool->mutex_);
705   known_bad_symbols_.clear();
706   known_bad_files_.clear();
707   Symbol result = FindSymbol(name);
708 
709   if (result.IsNull() && pool->underlay_ != NULL) {
710     // Symbol not found; check the underlay.
711     result =
712       pool->underlay_->tables_->FindByNameHelper(pool->underlay_, name);
713   }
714 
715   if (result.IsNull()) {
716     // Symbol still not found, so check fallback database.
717     if (pool->TryFindSymbolInFallbackDatabase(name)) {
718       result = FindSymbol(name);
719     }
720   }
721 
722   return result;
723 }
724 
FindFile(const string & key) const725 inline const FileDescriptor* DescriptorPool::Tables::FindFile(
726     const string& key) const {
727   return FindPtrOrNull(files_by_name_, key.c_str());
728 }
729 
FindFieldByNumber(const Descriptor * parent,int number) const730 inline const FieldDescriptor* FileDescriptorTables::FindFieldByNumber(
731     const Descriptor* parent, int number) const {
732   return FindPtrOrNull(fields_by_number_, make_pair(parent, number));
733 }
734 
FindFieldByLowercaseName(const void * parent,const string & lowercase_name) const735 inline const FieldDescriptor* FileDescriptorTables::FindFieldByLowercaseName(
736     const void* parent, const string& lowercase_name) const {
737   return FindPtrOrNull(fields_by_lowercase_name_,
738                        PointerStringPair(parent, lowercase_name.c_str()));
739 }
740 
FindFieldByCamelcaseName(const void * parent,const string & camelcase_name) const741 inline const FieldDescriptor* FileDescriptorTables::FindFieldByCamelcaseName(
742     const void* parent, const string& camelcase_name) const {
743   return FindPtrOrNull(fields_by_camelcase_name_,
744                        PointerStringPair(parent, camelcase_name.c_str()));
745 }
746 
FindEnumValueByNumber(const EnumDescriptor * parent,int number) const747 inline const EnumValueDescriptor* FileDescriptorTables::FindEnumValueByNumber(
748     const EnumDescriptor* parent, int number) const {
749   return FindPtrOrNull(enum_values_by_number_, make_pair(parent, number));
750 }
751 
FindExtension(const Descriptor * extendee,int number)752 inline const FieldDescriptor* DescriptorPool::Tables::FindExtension(
753     const Descriptor* extendee, int number) {
754   return FindPtrOrNull(extensions_, make_pair(extendee, number));
755 }
756 
FindAllExtensions(const Descriptor * extendee,vector<const FieldDescriptor * > * out) const757 inline void DescriptorPool::Tables::FindAllExtensions(
758     const Descriptor* extendee, vector<const FieldDescriptor*>* out) const {
759   ExtensionsGroupedByDescriptorMap::const_iterator it =
760       extensions_.lower_bound(make_pair(extendee, 0));
761   for (; it != extensions_.end() && it->first.first == extendee; ++it) {
762     out->push_back(it->second);
763   }
764 }
765 
766 // -------------------------------------------------------------------
767 
AddSymbol(const string & full_name,Symbol symbol)768 bool DescriptorPool::Tables::AddSymbol(
769     const string& full_name, Symbol symbol) {
770   if (InsertIfNotPresent(&symbols_by_name_, full_name.c_str(), symbol)) {
771     symbols_after_checkpoint_.push_back(full_name.c_str());
772     return true;
773   } else {
774     return false;
775   }
776 }
777 
AddAliasUnderParent(const void * parent,const string & name,Symbol symbol)778 bool FileDescriptorTables::AddAliasUnderParent(
779     const void* parent, const string& name, Symbol symbol) {
780   PointerStringPair by_parent_key(parent, name.c_str());
781   return InsertIfNotPresent(&symbols_by_parent_, by_parent_key, symbol);
782 }
783 
AddFile(const FileDescriptor * file)784 bool DescriptorPool::Tables::AddFile(const FileDescriptor* file) {
785   if (InsertIfNotPresent(&files_by_name_, file->name().c_str(), file)) {
786     files_after_checkpoint_.push_back(file->name().c_str());
787     return true;
788   } else {
789     return false;
790   }
791 }
792 
AddFieldByStylizedNames(const FieldDescriptor * field)793 void FileDescriptorTables::AddFieldByStylizedNames(
794     const FieldDescriptor* field) {
795   const void* parent;
796   if (field->is_extension()) {
797     if (field->extension_scope() == NULL) {
798       parent = field->file();
799     } else {
800       parent = field->extension_scope();
801     }
802   } else {
803     parent = field->containing_type();
804   }
805 
806   PointerStringPair lowercase_key(parent, field->lowercase_name().c_str());
807   InsertIfNotPresent(&fields_by_lowercase_name_, lowercase_key, field);
808 
809   PointerStringPair camelcase_key(parent, field->camelcase_name().c_str());
810   InsertIfNotPresent(&fields_by_camelcase_name_, camelcase_key, field);
811 }
812 
AddFieldByNumber(const FieldDescriptor * field)813 bool FileDescriptorTables::AddFieldByNumber(const FieldDescriptor* field) {
814   DescriptorIntPair key(field->containing_type(), field->number());
815   return InsertIfNotPresent(&fields_by_number_, key, field);
816 }
817 
AddEnumValueByNumber(const EnumValueDescriptor * value)818 bool FileDescriptorTables::AddEnumValueByNumber(
819     const EnumValueDescriptor* value) {
820   EnumIntPair key(value->type(), value->number());
821   return InsertIfNotPresent(&enum_values_by_number_, key, value);
822 }
823 
AddExtension(const FieldDescriptor * field)824 bool DescriptorPool::Tables::AddExtension(const FieldDescriptor* field) {
825   DescriptorIntPair key(field->containing_type(), field->number());
826   if (InsertIfNotPresent(&extensions_, key, field)) {
827     extensions_after_checkpoint_.push_back(key);
828     return true;
829   } else {
830     return false;
831   }
832 }
833 
834 // -------------------------------------------------------------------
835 
836 template<typename Type>
Allocate()837 Type* DescriptorPool::Tables::Allocate() {
838   return reinterpret_cast<Type*>(AllocateBytes(sizeof(Type)));
839 }
840 
841 template<typename Type>
AllocateArray(int count)842 Type* DescriptorPool::Tables::AllocateArray(int count) {
843   return reinterpret_cast<Type*>(AllocateBytes(sizeof(Type) * count));
844 }
845 
AllocateString(const string & value)846 string* DescriptorPool::Tables::AllocateString(const string& value) {
847   string* result = new string(value);
848   strings_.push_back(result);
849   return result;
850 }
851 
852 template<typename Type>
AllocateMessage(Type *)853 Type* DescriptorPool::Tables::AllocateMessage(Type* /* dummy */) {
854   Type* result = new Type;
855   messages_.push_back(result);
856   return result;
857 }
858 
AllocateFileTables()859 FileDescriptorTables* DescriptorPool::Tables::AllocateFileTables() {
860   FileDescriptorTables* result = new FileDescriptorTables;
861   file_tables_.push_back(result);
862   return result;
863 }
864 
AllocateBytes(int size)865 void* DescriptorPool::Tables::AllocateBytes(int size) {
866   // TODO(kenton):  Would it be worthwhile to implement this in some more
867   // sophisticated way?  Probably not for the open source release, but for
868   // internal use we could easily plug in one of our existing memory pool
869   // allocators...
870   if (size == 0) return NULL;
871 
872   void* result = operator new(size);
873   allocations_.push_back(result);
874   return result;
875 }
876 
BuildLocationsByPath(pair<const FileDescriptorTables *,const SourceCodeInfo * > * p)877 void FileDescriptorTables::BuildLocationsByPath(
878     pair<const FileDescriptorTables*, const SourceCodeInfo*>* p) {
879   for (int i = 0, len = p->second->location_size(); i < len; ++i) {
880     const SourceCodeInfo_Location* loc = &p->second->location().Get(i);
881     p->first->locations_by_path_[Join(loc->path(), ",")] = loc;
882   }
883 }
884 
GetSourceLocation(const vector<int> & path,const SourceCodeInfo * info) const885 const SourceCodeInfo_Location* FileDescriptorTables::GetSourceLocation(
886     const vector<int>& path, const SourceCodeInfo* info) const {
887   pair<const FileDescriptorTables*, const SourceCodeInfo*> p(
888       make_pair(this, info));
889   locations_by_path_once_.Init(&FileDescriptorTables::BuildLocationsByPath, &p);
890   return FindPtrOrNull(locations_by_path_, Join(path, ","));
891 }
892 
893 // ===================================================================
894 // DescriptorPool
895 
~ErrorCollector()896 DescriptorPool::ErrorCollector::~ErrorCollector() {}
897 
DescriptorPool()898 DescriptorPool::DescriptorPool()
899   : mutex_(NULL),
900     fallback_database_(NULL),
901     default_error_collector_(NULL),
902     underlay_(NULL),
903     tables_(new Tables),
904     enforce_dependencies_(true),
905     allow_unknown_(false),
906     enforce_weak_(false) {}
907 
DescriptorPool(DescriptorDatabase * fallback_database,ErrorCollector * error_collector)908 DescriptorPool::DescriptorPool(DescriptorDatabase* fallback_database,
909                                ErrorCollector* error_collector)
910   : mutex_(new Mutex),
911     fallback_database_(fallback_database),
912     default_error_collector_(error_collector),
913     underlay_(NULL),
914     tables_(new Tables),
915     enforce_dependencies_(true),
916     allow_unknown_(false),
917     enforce_weak_(false) {
918 }
919 
DescriptorPool(const DescriptorPool * underlay)920 DescriptorPool::DescriptorPool(const DescriptorPool* underlay)
921   : mutex_(NULL),
922     fallback_database_(NULL),
923     default_error_collector_(NULL),
924     underlay_(underlay),
925     tables_(new Tables),
926     enforce_dependencies_(true),
927     allow_unknown_(false),
928     enforce_weak_(false) {}
929 
~DescriptorPool()930 DescriptorPool::~DescriptorPool() {
931   if (mutex_ != NULL) delete mutex_;
932 }
933 
934 // DescriptorPool::BuildFile() defined later.
935 // DescriptorPool::BuildFileCollectingErrors() defined later.
936 
InternalDontEnforceDependencies()937 void DescriptorPool::InternalDontEnforceDependencies() {
938   enforce_dependencies_ = false;
939 }
940 
AddUnusedImportTrackFile(const string & file_name)941 void DescriptorPool::AddUnusedImportTrackFile(const string& file_name) {
942   unused_import_track_files_.insert(file_name);
943 }
944 
ClearUnusedImportTrackFiles()945 void DescriptorPool::ClearUnusedImportTrackFiles() {
946   unused_import_track_files_.clear();
947 }
948 
InternalIsFileLoaded(const string & filename) const949 bool DescriptorPool::InternalIsFileLoaded(const string& filename) const {
950   MutexLockMaybe lock(mutex_);
951   return tables_->FindFile(filename) != NULL;
952 }
953 
954 // generated_pool ====================================================
955 
956 namespace {
957 
958 
959 EncodedDescriptorDatabase* generated_database_ = NULL;
960 DescriptorPool* generated_pool_ = NULL;
961 GOOGLE_PROTOBUF_DECLARE_ONCE(generated_pool_init_);
962 
DeleteGeneratedPool()963 void DeleteGeneratedPool() {
964   delete generated_database_;
965   generated_database_ = NULL;
966   delete generated_pool_;
967   generated_pool_ = NULL;
968 }
969 
InitGeneratedPool()970 static void InitGeneratedPool() {
971   generated_database_ = new EncodedDescriptorDatabase;
972   generated_pool_ = new DescriptorPool(generated_database_);
973 
974   internal::OnShutdown(&DeleteGeneratedPool);
975 }
976 
InitGeneratedPoolOnce()977 inline void InitGeneratedPoolOnce() {
978   ::google::protobuf::GoogleOnceInit(&generated_pool_init_, &InitGeneratedPool);
979 }
980 
981 }  // anonymous namespace
982 
generated_pool()983 const DescriptorPool* DescriptorPool::generated_pool() {
984   InitGeneratedPoolOnce();
985   return generated_pool_;
986 }
987 
internal_generated_pool()988 DescriptorPool* DescriptorPool::internal_generated_pool() {
989   InitGeneratedPoolOnce();
990   return generated_pool_;
991 }
992 
InternalAddGeneratedFile(const void * encoded_file_descriptor,int size)993 void DescriptorPool::InternalAddGeneratedFile(
994     const void* encoded_file_descriptor, int size) {
995   // So, this function is called in the process of initializing the
996   // descriptors for generated proto classes.  Each generated .pb.cc file
997   // has an internal procedure called AddDescriptors() which is called at
998   // process startup, and that function calls this one in order to register
999   // the raw bytes of the FileDescriptorProto representing the file.
1000   //
1001   // We do not actually construct the descriptor objects right away.  We just
1002   // hang on to the bytes until they are actually needed.  We actually construct
1003   // the descriptor the first time one of the following things happens:
1004   // * Someone calls a method like descriptor(), GetDescriptor(), or
1005   //   GetReflection() on the generated types, which requires returning the
1006   //   descriptor or an object based on it.
1007   // * Someone looks up the descriptor in DescriptorPool::generated_pool().
1008   //
1009   // Once one of these happens, the DescriptorPool actually parses the
1010   // FileDescriptorProto and generates a FileDescriptor (and all its children)
1011   // based on it.
1012   //
1013   // Note that FileDescriptorProto is itself a generated protocol message.
1014   // Therefore, when we parse one, we have to be very careful to avoid using
1015   // any descriptor-based operations, since this might cause infinite recursion
1016   // or deadlock.
1017   InitGeneratedPoolOnce();
1018   GOOGLE_CHECK(generated_database_->Add(encoded_file_descriptor, size));
1019 }
1020 
1021 
1022 // Find*By* methods ==================================================
1023 
1024 // TODO(kenton):  There's a lot of repeated code here, but I'm not sure if
1025 //   there's any good way to factor it out.  Think about this some time when
1026 //   there's nothing more important to do (read: never).
1027 
FindFileByName(const string & name) const1028 const FileDescriptor* DescriptorPool::FindFileByName(const string& name) const {
1029   MutexLockMaybe lock(mutex_);
1030   tables_->known_bad_symbols_.clear();
1031   tables_->known_bad_files_.clear();
1032   const FileDescriptor* result = tables_->FindFile(name);
1033   if (result != NULL) return result;
1034   if (underlay_ != NULL) {
1035     result = underlay_->FindFileByName(name);
1036     if (result != NULL) return result;
1037   }
1038   if (TryFindFileInFallbackDatabase(name)) {
1039     result = tables_->FindFile(name);
1040     if (result != NULL) return result;
1041   }
1042   return NULL;
1043 }
1044 
FindFileContainingSymbol(const string & symbol_name) const1045 const FileDescriptor* DescriptorPool::FindFileContainingSymbol(
1046     const string& symbol_name) const {
1047   MutexLockMaybe lock(mutex_);
1048   tables_->known_bad_symbols_.clear();
1049   tables_->known_bad_files_.clear();
1050   Symbol result = tables_->FindSymbol(symbol_name);
1051   if (!result.IsNull()) return result.GetFile();
1052   if (underlay_ != NULL) {
1053     const FileDescriptor* file_result =
1054       underlay_->FindFileContainingSymbol(symbol_name);
1055     if (file_result != NULL) return file_result;
1056   }
1057   if (TryFindSymbolInFallbackDatabase(symbol_name)) {
1058     result = tables_->FindSymbol(symbol_name);
1059     if (!result.IsNull()) return result.GetFile();
1060   }
1061   return NULL;
1062 }
1063 
FindMessageTypeByName(const string & name) const1064 const Descriptor* DescriptorPool::FindMessageTypeByName(
1065     const string& name) const {
1066   Symbol result = tables_->FindByNameHelper(this, name);
1067   return (result.type == Symbol::MESSAGE) ? result.descriptor : NULL;
1068 }
1069 
FindFieldByName(const string & name) const1070 const FieldDescriptor* DescriptorPool::FindFieldByName(
1071     const string& name) const {
1072   Symbol result = tables_->FindByNameHelper(this, name);
1073   if (result.type == Symbol::FIELD &&
1074       !result.field_descriptor->is_extension()) {
1075     return result.field_descriptor;
1076   } else {
1077     return NULL;
1078   }
1079 }
1080 
FindExtensionByName(const string & name) const1081 const FieldDescriptor* DescriptorPool::FindExtensionByName(
1082     const string& name) const {
1083   Symbol result = tables_->FindByNameHelper(this, name);
1084   if (result.type == Symbol::FIELD &&
1085       result.field_descriptor->is_extension()) {
1086     return result.field_descriptor;
1087   } else {
1088     return NULL;
1089   }
1090 }
1091 
FindOneofByName(const string & name) const1092 const OneofDescriptor* DescriptorPool::FindOneofByName(
1093     const string& name) const {
1094   Symbol result = tables_->FindByNameHelper(this, name);
1095   return (result.type == Symbol::ONEOF) ? result.oneof_descriptor : NULL;
1096 }
1097 
FindEnumTypeByName(const string & name) const1098 const EnumDescriptor* DescriptorPool::FindEnumTypeByName(
1099     const string& name) const {
1100   Symbol result = tables_->FindByNameHelper(this, name);
1101   return (result.type == Symbol::ENUM) ? result.enum_descriptor : NULL;
1102 }
1103 
FindEnumValueByName(const string & name) const1104 const EnumValueDescriptor* DescriptorPool::FindEnumValueByName(
1105     const string& name) const {
1106   Symbol result = tables_->FindByNameHelper(this, name);
1107   return (result.type == Symbol::ENUM_VALUE) ?
1108     result.enum_value_descriptor : NULL;
1109 }
1110 
FindServiceByName(const string & name) const1111 const ServiceDescriptor* DescriptorPool::FindServiceByName(
1112     const string& name) const {
1113   Symbol result = tables_->FindByNameHelper(this, name);
1114   return (result.type == Symbol::SERVICE) ? result.service_descriptor : NULL;
1115 }
1116 
FindMethodByName(const string & name) const1117 const MethodDescriptor* DescriptorPool::FindMethodByName(
1118     const string& name) const {
1119   Symbol result = tables_->FindByNameHelper(this, name);
1120   return (result.type == Symbol::METHOD) ? result.method_descriptor : NULL;
1121 }
1122 
FindExtensionByNumber(const Descriptor * extendee,int number) const1123 const FieldDescriptor* DescriptorPool::FindExtensionByNumber(
1124     const Descriptor* extendee, int number) const {
1125   MutexLockMaybe lock(mutex_);
1126   tables_->known_bad_symbols_.clear();
1127   tables_->known_bad_files_.clear();
1128   const FieldDescriptor* result = tables_->FindExtension(extendee, number);
1129   if (result != NULL) {
1130     return result;
1131   }
1132   if (underlay_ != NULL) {
1133     result = underlay_->FindExtensionByNumber(extendee, number);
1134     if (result != NULL) return result;
1135   }
1136   if (TryFindExtensionInFallbackDatabase(extendee, number)) {
1137     result = tables_->FindExtension(extendee, number);
1138     if (result != NULL) {
1139       return result;
1140     }
1141   }
1142   return NULL;
1143 }
1144 
FindAllExtensions(const Descriptor * extendee,vector<const FieldDescriptor * > * out) const1145 void DescriptorPool::FindAllExtensions(
1146     const Descriptor* extendee, vector<const FieldDescriptor*>* out) const {
1147   MutexLockMaybe lock(mutex_);
1148   tables_->known_bad_symbols_.clear();
1149   tables_->known_bad_files_.clear();
1150 
1151   // Initialize tables_->extensions_ from the fallback database first
1152   // (but do this only once per descriptor).
1153   if (fallback_database_ != NULL &&
1154       tables_->extensions_loaded_from_db_.count(extendee) == 0) {
1155     vector<int> numbers;
1156     if (fallback_database_->FindAllExtensionNumbers(extendee->full_name(),
1157                                                     &numbers)) {
1158       for (int i = 0; i < numbers.size(); ++i) {
1159         int number = numbers[i];
1160         if (tables_->FindExtension(extendee, number) == NULL) {
1161           TryFindExtensionInFallbackDatabase(extendee, number);
1162         }
1163       }
1164       tables_->extensions_loaded_from_db_.insert(extendee);
1165     }
1166   }
1167 
1168   tables_->FindAllExtensions(extendee, out);
1169   if (underlay_ != NULL) {
1170     underlay_->FindAllExtensions(extendee, out);
1171   }
1172 }
1173 
1174 
1175 // -------------------------------------------------------------------
1176 
1177 const FieldDescriptor*
FindFieldByNumber(int key) const1178 Descriptor::FindFieldByNumber(int key) const {
1179   const FieldDescriptor* result =
1180     file()->tables_->FindFieldByNumber(this, key);
1181   if (result == NULL || result->is_extension()) {
1182     return NULL;
1183   } else {
1184     return result;
1185   }
1186 }
1187 
1188 const FieldDescriptor*
FindFieldByLowercaseName(const string & key) const1189 Descriptor::FindFieldByLowercaseName(const string& key) const {
1190   const FieldDescriptor* result =
1191     file()->tables_->FindFieldByLowercaseName(this, key);
1192   if (result == NULL || result->is_extension()) {
1193     return NULL;
1194   } else {
1195     return result;
1196   }
1197 }
1198 
1199 const FieldDescriptor*
FindFieldByCamelcaseName(const string & key) const1200 Descriptor::FindFieldByCamelcaseName(const string& key) const {
1201   const FieldDescriptor* result =
1202     file()->tables_->FindFieldByCamelcaseName(this, key);
1203   if (result == NULL || result->is_extension()) {
1204     return NULL;
1205   } else {
1206     return result;
1207   }
1208 }
1209 
1210 const FieldDescriptor*
FindFieldByName(const string & key) const1211 Descriptor::FindFieldByName(const string& key) const {
1212   Symbol result =
1213     file()->tables_->FindNestedSymbolOfType(this, key, Symbol::FIELD);
1214   if (!result.IsNull() && !result.field_descriptor->is_extension()) {
1215     return result.field_descriptor;
1216   } else {
1217     return NULL;
1218   }
1219 }
1220 
1221 const OneofDescriptor*
FindOneofByName(const string & key) const1222 Descriptor::FindOneofByName(const string& key) const {
1223   Symbol result =
1224     file()->tables_->FindNestedSymbolOfType(this, key, Symbol::ONEOF);
1225   if (!result.IsNull()) {
1226     return result.oneof_descriptor;
1227   } else {
1228     return NULL;
1229   }
1230 }
1231 
1232 const FieldDescriptor*
FindExtensionByName(const string & key) const1233 Descriptor::FindExtensionByName(const string& key) const {
1234   Symbol result =
1235     file()->tables_->FindNestedSymbolOfType(this, key, Symbol::FIELD);
1236   if (!result.IsNull() && result.field_descriptor->is_extension()) {
1237     return result.field_descriptor;
1238   } else {
1239     return NULL;
1240   }
1241 }
1242 
1243 const FieldDescriptor*
FindExtensionByLowercaseName(const string & key) const1244 Descriptor::FindExtensionByLowercaseName(const string& key) const {
1245   const FieldDescriptor* result =
1246     file()->tables_->FindFieldByLowercaseName(this, key);
1247   if (result == NULL || !result->is_extension()) {
1248     return NULL;
1249   } else {
1250     return result;
1251   }
1252 }
1253 
1254 const FieldDescriptor*
FindExtensionByCamelcaseName(const string & key) const1255 Descriptor::FindExtensionByCamelcaseName(const string& key) const {
1256   const FieldDescriptor* result =
1257     file()->tables_->FindFieldByCamelcaseName(this, key);
1258   if (result == NULL || !result->is_extension()) {
1259     return NULL;
1260   } else {
1261     return result;
1262   }
1263 }
1264 
1265 const Descriptor*
FindNestedTypeByName(const string & key) const1266 Descriptor::FindNestedTypeByName(const string& key) const {
1267   Symbol result =
1268     file()->tables_->FindNestedSymbolOfType(this, key, Symbol::MESSAGE);
1269   if (!result.IsNull()) {
1270     return result.descriptor;
1271   } else {
1272     return NULL;
1273   }
1274 }
1275 
1276 const EnumDescriptor*
FindEnumTypeByName(const string & key) const1277 Descriptor::FindEnumTypeByName(const string& key) const {
1278   Symbol result =
1279     file()->tables_->FindNestedSymbolOfType(this, key, Symbol::ENUM);
1280   if (!result.IsNull()) {
1281     return result.enum_descriptor;
1282   } else {
1283     return NULL;
1284   }
1285 }
1286 
1287 const EnumValueDescriptor*
FindEnumValueByName(const string & key) const1288 Descriptor::FindEnumValueByName(const string& key) const {
1289   Symbol result =
1290     file()->tables_->FindNestedSymbolOfType(this, key, Symbol::ENUM_VALUE);
1291   if (!result.IsNull()) {
1292     return result.enum_value_descriptor;
1293   } else {
1294     return NULL;
1295   }
1296 }
1297 
1298 const EnumValueDescriptor*
FindValueByName(const string & key) const1299 EnumDescriptor::FindValueByName(const string& key) const {
1300   Symbol result =
1301     file()->tables_->FindNestedSymbolOfType(this, key, Symbol::ENUM_VALUE);
1302   if (!result.IsNull()) {
1303     return result.enum_value_descriptor;
1304   } else {
1305     return NULL;
1306   }
1307 }
1308 
1309 const EnumValueDescriptor*
FindValueByNumber(int key) const1310 EnumDescriptor::FindValueByNumber(int key) const {
1311   return file()->tables_->FindEnumValueByNumber(this, key);
1312 }
1313 
1314 const MethodDescriptor*
FindMethodByName(const string & key) const1315 ServiceDescriptor::FindMethodByName(const string& key) const {
1316   Symbol result =
1317     file()->tables_->FindNestedSymbolOfType(this, key, Symbol::METHOD);
1318   if (!result.IsNull()) {
1319     return result.method_descriptor;
1320   } else {
1321     return NULL;
1322   }
1323 }
1324 
1325 const Descriptor*
FindMessageTypeByName(const string & key) const1326 FileDescriptor::FindMessageTypeByName(const string& key) const {
1327   Symbol result = tables_->FindNestedSymbolOfType(this, key, Symbol::MESSAGE);
1328   if (!result.IsNull()) {
1329     return result.descriptor;
1330   } else {
1331     return NULL;
1332   }
1333 }
1334 
1335 const EnumDescriptor*
FindEnumTypeByName(const string & key) const1336 FileDescriptor::FindEnumTypeByName(const string& key) const {
1337   Symbol result = tables_->FindNestedSymbolOfType(this, key, Symbol::ENUM);
1338   if (!result.IsNull()) {
1339     return result.enum_descriptor;
1340   } else {
1341     return NULL;
1342   }
1343 }
1344 
1345 const EnumValueDescriptor*
FindEnumValueByName(const string & key) const1346 FileDescriptor::FindEnumValueByName(const string& key) const {
1347   Symbol result =
1348     tables_->FindNestedSymbolOfType(this, key, Symbol::ENUM_VALUE);
1349   if (!result.IsNull()) {
1350     return result.enum_value_descriptor;
1351   } else {
1352     return NULL;
1353   }
1354 }
1355 
1356 const ServiceDescriptor*
FindServiceByName(const string & key) const1357 FileDescriptor::FindServiceByName(const string& key) const {
1358   Symbol result = tables_->FindNestedSymbolOfType(this, key, Symbol::SERVICE);
1359   if (!result.IsNull()) {
1360     return result.service_descriptor;
1361   } else {
1362     return NULL;
1363   }
1364 }
1365 
1366 const FieldDescriptor*
FindExtensionByName(const string & key) const1367 FileDescriptor::FindExtensionByName(const string& key) const {
1368   Symbol result = tables_->FindNestedSymbolOfType(this, key, Symbol::FIELD);
1369   if (!result.IsNull() && result.field_descriptor->is_extension()) {
1370     return result.field_descriptor;
1371   } else {
1372     return NULL;
1373   }
1374 }
1375 
1376 const FieldDescriptor*
FindExtensionByLowercaseName(const string & key) const1377 FileDescriptor::FindExtensionByLowercaseName(const string& key) const {
1378   const FieldDescriptor* result = tables_->FindFieldByLowercaseName(this, key);
1379   if (result == NULL || !result->is_extension()) {
1380     return NULL;
1381   } else {
1382     return result;
1383   }
1384 }
1385 
1386 const FieldDescriptor*
FindExtensionByCamelcaseName(const string & key) const1387 FileDescriptor::FindExtensionByCamelcaseName(const string& key) const {
1388   const FieldDescriptor* result = tables_->FindFieldByCamelcaseName(this, key);
1389   if (result == NULL || !result->is_extension()) {
1390     return NULL;
1391   } else {
1392     return result;
1393   }
1394 }
1395 
1396 const Descriptor::ExtensionRange*
FindExtensionRangeContainingNumber(int number) const1397 Descriptor::FindExtensionRangeContainingNumber(int number) const {
1398   // Linear search should be fine because we don't expect a message to have
1399   // more than a couple extension ranges.
1400   for (int i = 0; i < extension_range_count(); i++) {
1401     if (number >= extension_range(i)->start &&
1402         number <  extension_range(i)->end) {
1403       return extension_range(i);
1404     }
1405   }
1406   return NULL;
1407 }
1408 
1409 // -------------------------------------------------------------------
1410 
TryFindFileInFallbackDatabase(const string & name) const1411 bool DescriptorPool::TryFindFileInFallbackDatabase(const string& name) const {
1412   if (fallback_database_ == NULL) return false;
1413 
1414   if (tables_->known_bad_files_.count(name) > 0) return false;
1415 
1416   FileDescriptorProto file_proto;
1417   if (!fallback_database_->FindFileByName(name, &file_proto) ||
1418       BuildFileFromDatabase(file_proto) == NULL) {
1419     tables_->known_bad_files_.insert(name);
1420     return false;
1421   }
1422   return true;
1423 }
1424 
IsSubSymbolOfBuiltType(const string & name) const1425 bool DescriptorPool::IsSubSymbolOfBuiltType(const string& name) const {
1426   string prefix = name;
1427   for (;;) {
1428     string::size_type dot_pos = prefix.find_last_of('.');
1429     if (dot_pos == string::npos) {
1430       break;
1431     }
1432     prefix = prefix.substr(0, dot_pos);
1433     Symbol symbol = tables_->FindSymbol(prefix);
1434     // If the symbol type is anything other than PACKAGE, then its complete
1435     // definition is already known.
1436     if (!symbol.IsNull() && symbol.type != Symbol::PACKAGE) {
1437       return true;
1438     }
1439   }
1440   if (underlay_ != NULL) {
1441     // Check to see if any prefix of this symbol exists in the underlay.
1442     return underlay_->IsSubSymbolOfBuiltType(name);
1443   }
1444   return false;
1445 }
1446 
TryFindSymbolInFallbackDatabase(const string & name) const1447 bool DescriptorPool::TryFindSymbolInFallbackDatabase(const string& name) const {
1448   if (fallback_database_ == NULL) return false;
1449 
1450   if (tables_->known_bad_symbols_.count(name) > 0) return false;
1451 
1452   FileDescriptorProto file_proto;
1453   if (// We skip looking in the fallback database if the name is a sub-symbol
1454       // of any descriptor that already exists in the descriptor pool (except
1455       // for package descriptors).  This is valid because all symbols except
1456       // for packages are defined in a single file, so if the symbol exists
1457       // then we should already have its definition.
1458       //
1459       // The other reason to do this is to support "overriding" type
1460       // definitions by merging two databases that define the same type.  (Yes,
1461       // people do this.)  The main difficulty with making this work is that
1462       // FindFileContainingSymbol() is allowed to return both false positives
1463       // (e.g., SimpleDescriptorDatabase, UpgradedDescriptorDatabase) and false
1464       // negatives (e.g. ProtoFileParser, SourceTreeDescriptorDatabase).
1465       // When two such databases are merged, looking up a non-existent
1466       // sub-symbol of a type that already exists in the descriptor pool can
1467       // result in an attempt to load multiple definitions of the same type.
1468       // The check below avoids this.
1469       IsSubSymbolOfBuiltType(name)
1470 
1471       // Look up file containing this symbol in fallback database.
1472       || !fallback_database_->FindFileContainingSymbol(name, &file_proto)
1473 
1474       // Check if we've already built this file. If so, it apparently doesn't
1475       // contain the symbol we're looking for.  Some DescriptorDatabases
1476       // return false positives.
1477       || tables_->FindFile(file_proto.name()) != NULL
1478 
1479       // Build the file.
1480       || BuildFileFromDatabase(file_proto) == NULL) {
1481     tables_->known_bad_symbols_.insert(name);
1482     return false;
1483   }
1484 
1485   return true;
1486 }
1487 
TryFindExtensionInFallbackDatabase(const Descriptor * containing_type,int field_number) const1488 bool DescriptorPool::TryFindExtensionInFallbackDatabase(
1489     const Descriptor* containing_type, int field_number) const {
1490   if (fallback_database_ == NULL) return false;
1491 
1492   FileDescriptorProto file_proto;
1493   if (!fallback_database_->FindFileContainingExtension(
1494         containing_type->full_name(), field_number, &file_proto)) {
1495     return false;
1496   }
1497 
1498   if (tables_->FindFile(file_proto.name()) != NULL) {
1499     // We've already loaded this file, and it apparently doesn't contain the
1500     // extension we're looking for.  Some DescriptorDatabases return false
1501     // positives.
1502     return false;
1503   }
1504 
1505   if (BuildFileFromDatabase(file_proto) == NULL) {
1506     return false;
1507   }
1508 
1509   return true;
1510 }
1511 
1512 // ===================================================================
1513 
DefaultValueAsString(bool quote_string_type) const1514 string FieldDescriptor::DefaultValueAsString(bool quote_string_type) const {
1515   GOOGLE_CHECK(has_default_value()) << "No default value";
1516   switch (cpp_type()) {
1517     case CPPTYPE_INT32:
1518       return SimpleItoa(default_value_int32());
1519       break;
1520     case CPPTYPE_INT64:
1521       return SimpleItoa(default_value_int64());
1522       break;
1523     case CPPTYPE_UINT32:
1524       return SimpleItoa(default_value_uint32());
1525       break;
1526     case CPPTYPE_UINT64:
1527       return SimpleItoa(default_value_uint64());
1528       break;
1529     case CPPTYPE_FLOAT:
1530       return SimpleFtoa(default_value_float());
1531       break;
1532     case CPPTYPE_DOUBLE:
1533       return SimpleDtoa(default_value_double());
1534       break;
1535     case CPPTYPE_BOOL:
1536       return default_value_bool() ? "true" : "false";
1537       break;
1538     case CPPTYPE_STRING:
1539       if (quote_string_type) {
1540         return "\"" + CEscape(default_value_string()) + "\"";
1541       } else {
1542         if (type() == TYPE_BYTES) {
1543           return CEscape(default_value_string());
1544         } else {
1545           return default_value_string();
1546         }
1547       }
1548       break;
1549     case CPPTYPE_ENUM:
1550       return default_value_enum()->name();
1551       break;
1552     case CPPTYPE_MESSAGE:
1553       GOOGLE_LOG(DFATAL) << "Messages can't have default values!";
1554       break;
1555   }
1556   GOOGLE_LOG(FATAL) << "Can't get here: failed to get default value as string";
1557   return "";
1558 }
1559 
1560 // CopyTo methods ====================================================
1561 
CopyTo(FileDescriptorProto * proto) const1562 void FileDescriptor::CopyTo(FileDescriptorProto* proto) const {
1563   proto->set_name(name());
1564   if (!package().empty()) proto->set_package(package());
1565 
1566   for (int i = 0; i < dependency_count(); i++) {
1567     proto->add_dependency(dependency(i)->name());
1568   }
1569 
1570   for (int i = 0; i < public_dependency_count(); i++) {
1571     proto->add_public_dependency(public_dependencies_[i]);
1572   }
1573 
1574   for (int i = 0; i < weak_dependency_count(); i++) {
1575     proto->add_weak_dependency(weak_dependencies_[i]);
1576   }
1577 
1578   for (int i = 0; i < message_type_count(); i++) {
1579     message_type(i)->CopyTo(proto->add_message_type());
1580   }
1581   for (int i = 0; i < enum_type_count(); i++) {
1582     enum_type(i)->CopyTo(proto->add_enum_type());
1583   }
1584   for (int i = 0; i < service_count(); i++) {
1585     service(i)->CopyTo(proto->add_service());
1586   }
1587   for (int i = 0; i < extension_count(); i++) {
1588     extension(i)->CopyTo(proto->add_extension());
1589   }
1590 
1591   if (&options() != &FileOptions::default_instance()) {
1592     proto->mutable_options()->CopyFrom(options());
1593   }
1594 }
1595 
CopySourceCodeInfoTo(FileDescriptorProto * proto) const1596 void FileDescriptor::CopySourceCodeInfoTo(FileDescriptorProto* proto) const {
1597   if (source_code_info_ != &SourceCodeInfo::default_instance()) {
1598     proto->mutable_source_code_info()->CopyFrom(*source_code_info_);
1599   }
1600 }
1601 
CopyTo(DescriptorProto * proto) const1602 void Descriptor::CopyTo(DescriptorProto* proto) const {
1603   proto->set_name(name());
1604 
1605   for (int i = 0; i < field_count(); i++) {
1606     field(i)->CopyTo(proto->add_field());
1607   }
1608   for (int i = 0; i < oneof_decl_count(); i++) {
1609     oneof_decl(i)->CopyTo(proto->add_oneof_decl());
1610   }
1611   for (int i = 0; i < nested_type_count(); i++) {
1612     nested_type(i)->CopyTo(proto->add_nested_type());
1613   }
1614   for (int i = 0; i < enum_type_count(); i++) {
1615     enum_type(i)->CopyTo(proto->add_enum_type());
1616   }
1617   for (int i = 0; i < extension_range_count(); i++) {
1618     DescriptorProto::ExtensionRange* range = proto->add_extension_range();
1619     range->set_start(extension_range(i)->start);
1620     range->set_end(extension_range(i)->end);
1621   }
1622   for (int i = 0; i < extension_count(); i++) {
1623     extension(i)->CopyTo(proto->add_extension());
1624   }
1625 
1626   if (&options() != &MessageOptions::default_instance()) {
1627     proto->mutable_options()->CopyFrom(options());
1628   }
1629 }
1630 
CopyTo(FieldDescriptorProto * proto) const1631 void FieldDescriptor::CopyTo(FieldDescriptorProto* proto) const {
1632   proto->set_name(name());
1633   proto->set_number(number());
1634 
1635   // Some compilers do not allow static_cast directly between two enum types,
1636   // so we must cast to int first.
1637   proto->set_label(static_cast<FieldDescriptorProto::Label>(
1638                      implicit_cast<int>(label())));
1639   proto->set_type(static_cast<FieldDescriptorProto::Type>(
1640                     implicit_cast<int>(type())));
1641 
1642   if (is_extension()) {
1643     if (!containing_type()->is_unqualified_placeholder_) {
1644       proto->set_extendee(".");
1645     }
1646     proto->mutable_extendee()->append(containing_type()->full_name());
1647   }
1648 
1649   if (cpp_type() == CPPTYPE_MESSAGE) {
1650     if (message_type()->is_placeholder_) {
1651       // We don't actually know if the type is a message type.  It could be
1652       // an enum.
1653       proto->clear_type();
1654     }
1655 
1656     if (!message_type()->is_unqualified_placeholder_) {
1657       proto->set_type_name(".");
1658     }
1659     proto->mutable_type_name()->append(message_type()->full_name());
1660   } else if (cpp_type() == CPPTYPE_ENUM) {
1661     if (!enum_type()->is_unqualified_placeholder_) {
1662       proto->set_type_name(".");
1663     }
1664     proto->mutable_type_name()->append(enum_type()->full_name());
1665   }
1666 
1667   if (has_default_value()) {
1668     proto->set_default_value(DefaultValueAsString(false));
1669   }
1670 
1671   if (containing_oneof() != NULL && !is_extension()) {
1672     proto->set_oneof_index(containing_oneof()->index());
1673   }
1674 
1675   if (&options() != &FieldOptions::default_instance()) {
1676     proto->mutable_options()->CopyFrom(options());
1677   }
1678 }
1679 
CopyTo(OneofDescriptorProto * proto) const1680 void OneofDescriptor::CopyTo(OneofDescriptorProto* proto) const {
1681   proto->set_name(name());
1682 }
1683 
CopyTo(EnumDescriptorProto * proto) const1684 void EnumDescriptor::CopyTo(EnumDescriptorProto* proto) const {
1685   proto->set_name(name());
1686 
1687   for (int i = 0; i < value_count(); i++) {
1688     value(i)->CopyTo(proto->add_value());
1689   }
1690 
1691   if (&options() != &EnumOptions::default_instance()) {
1692     proto->mutable_options()->CopyFrom(options());
1693   }
1694 }
1695 
CopyTo(EnumValueDescriptorProto * proto) const1696 void EnumValueDescriptor::CopyTo(EnumValueDescriptorProto* proto) const {
1697   proto->set_name(name());
1698   proto->set_number(number());
1699 
1700   if (&options() != &EnumValueOptions::default_instance()) {
1701     proto->mutable_options()->CopyFrom(options());
1702   }
1703 }
1704 
CopyTo(ServiceDescriptorProto * proto) const1705 void ServiceDescriptor::CopyTo(ServiceDescriptorProto* proto) const {
1706   proto->set_name(name());
1707 
1708   for (int i = 0; i < method_count(); i++) {
1709     method(i)->CopyTo(proto->add_method());
1710   }
1711 
1712   if (&options() != &ServiceOptions::default_instance()) {
1713     proto->mutable_options()->CopyFrom(options());
1714   }
1715 }
1716 
CopyTo(MethodDescriptorProto * proto) const1717 void MethodDescriptor::CopyTo(MethodDescriptorProto* proto) const {
1718   proto->set_name(name());
1719 
1720   if (!input_type()->is_unqualified_placeholder_) {
1721     proto->set_input_type(".");
1722   }
1723   proto->mutable_input_type()->append(input_type()->full_name());
1724 
1725   if (!output_type()->is_unqualified_placeholder_) {
1726     proto->set_output_type(".");
1727   }
1728   proto->mutable_output_type()->append(output_type()->full_name());
1729 
1730   if (&options() != &MethodOptions::default_instance()) {
1731     proto->mutable_options()->CopyFrom(options());
1732   }
1733 }
1734 
1735 // DebugString methods ===============================================
1736 
1737 namespace {
1738 
1739 // Used by each of the option formatters.
RetrieveOptions(int depth,const Message & options,vector<string> * option_entries)1740 bool RetrieveOptions(int depth,
1741                      const Message &options,
1742                      vector<string> *option_entries) {
1743   option_entries->clear();
1744   const Reflection* reflection = options.GetReflection();
1745   vector<const FieldDescriptor*> fields;
1746   reflection->ListFields(options, &fields);
1747   for (int i = 0; i < fields.size(); i++) {
1748     int count = 1;
1749     bool repeated = false;
1750     if (fields[i]->is_repeated()) {
1751       count = reflection->FieldSize(options, fields[i]);
1752       repeated = true;
1753     }
1754     for (int j = 0; j < count; j++) {
1755       string fieldval;
1756       if (fields[i]->cpp_type() == FieldDescriptor::CPPTYPE_MESSAGE) {
1757         string tmp;
1758         TextFormat::Printer printer;
1759         printer.SetInitialIndentLevel(depth + 1);
1760         printer.PrintFieldValueToString(options, fields[i],
1761                                         repeated ? j : -1, &tmp);
1762         fieldval.append("{\n");
1763         fieldval.append(tmp);
1764         fieldval.append(depth * 2, ' ');
1765         fieldval.append("}");
1766       } else {
1767         TextFormat::PrintFieldValueToString(options, fields[i],
1768                                             repeated ? j : -1, &fieldval);
1769       }
1770       string name;
1771       if (fields[i]->is_extension()) {
1772         name = "(." + fields[i]->full_name() + ")";
1773       } else {
1774         name = fields[i]->name();
1775       }
1776       option_entries->push_back(name + " = " + fieldval);
1777     }
1778   }
1779   return !option_entries->empty();
1780 }
1781 
1782 // Formats options that all appear together in brackets. Does not include
1783 // brackets.
FormatBracketedOptions(int depth,const Message & options,string * output)1784 bool FormatBracketedOptions(int depth, const Message &options, string *output) {
1785   vector<string> all_options;
1786   if (RetrieveOptions(depth, options, &all_options)) {
1787     output->append(Join(all_options, ", "));
1788   }
1789   return !all_options.empty();
1790 }
1791 
1792 // Formats options one per line
FormatLineOptions(int depth,const Message & options,string * output)1793 bool FormatLineOptions(int depth, const Message &options, string *output) {
1794   string prefix(depth * 2, ' ');
1795   vector<string> all_options;
1796   if (RetrieveOptions(depth, options, &all_options)) {
1797     for (int i = 0; i < all_options.size(); i++) {
1798       strings::SubstituteAndAppend(output, "$0option $1;\n",
1799                                    prefix, all_options[i]);
1800     }
1801   }
1802   return !all_options.empty();
1803 }
1804 
1805 }  // anonymous namespace
1806 
DebugString() const1807 string FileDescriptor::DebugString() const {
1808   string contents = "syntax = \"proto2\";\n\n";
1809 
1810   set<int> public_dependencies;
1811   set<int> weak_dependencies;
1812   public_dependencies.insert(public_dependencies_,
1813                              public_dependencies_ + public_dependency_count_);
1814   weak_dependencies.insert(weak_dependencies_,
1815                            weak_dependencies_ + weak_dependency_count_);
1816 
1817   for (int i = 0; i < dependency_count(); i++) {
1818     if (public_dependencies.count(i) > 0) {
1819       strings::SubstituteAndAppend(&contents, "import public \"$0\";\n",
1820                                    dependency(i)->name());
1821     } else if (weak_dependencies.count(i) > 0) {
1822       strings::SubstituteAndAppend(&contents, "import weak \"$0\";\n",
1823                                    dependency(i)->name());
1824     } else {
1825       strings::SubstituteAndAppend(&contents, "import \"$0\";\n",
1826                                    dependency(i)->name());
1827     }
1828   }
1829 
1830   if (!package().empty()) {
1831     strings::SubstituteAndAppend(&contents, "package $0;\n\n", package());
1832   }
1833 
1834   if (FormatLineOptions(0, options(), &contents)) {
1835     contents.append("\n");  // add some space if we had options
1836   }
1837 
1838   for (int i = 0; i < enum_type_count(); i++) {
1839     enum_type(i)->DebugString(0, &contents);
1840     contents.append("\n");
1841   }
1842 
1843   // Find all the 'group' type extensions; we will not output their nested
1844   // definitions (those will be done with their group field descriptor).
1845   set<const Descriptor*> groups;
1846   for (int i = 0; i < extension_count(); i++) {
1847     if (extension(i)->type() == FieldDescriptor::TYPE_GROUP) {
1848       groups.insert(extension(i)->message_type());
1849     }
1850   }
1851 
1852   for (int i = 0; i < message_type_count(); i++) {
1853     if (groups.count(message_type(i)) == 0) {
1854       strings::SubstituteAndAppend(&contents, "message $0",
1855                                    message_type(i)->name());
1856       message_type(i)->DebugString(0, &contents);
1857       contents.append("\n");
1858     }
1859   }
1860 
1861   for (int i = 0; i < service_count(); i++) {
1862     service(i)->DebugString(&contents);
1863     contents.append("\n");
1864   }
1865 
1866   const Descriptor* containing_type = NULL;
1867   for (int i = 0; i < extension_count(); i++) {
1868     if (extension(i)->containing_type() != containing_type) {
1869       if (i > 0) contents.append("}\n\n");
1870       containing_type = extension(i)->containing_type();
1871       strings::SubstituteAndAppend(&contents, "extend .$0 {\n",
1872                                    containing_type->full_name());
1873     }
1874     extension(i)->DebugString(1, FieldDescriptor::PRINT_LABEL, &contents);
1875   }
1876   if (extension_count() > 0) contents.append("}\n\n");
1877 
1878   return contents;
1879 }
1880 
DebugString() const1881 string Descriptor::DebugString() const {
1882   string contents;
1883   strings::SubstituteAndAppend(&contents, "message $0", name());
1884   DebugString(0, &contents);
1885   return contents;
1886 }
1887 
DebugString(int depth,string * contents) const1888 void Descriptor::DebugString(int depth, string *contents) const {
1889   string prefix(depth * 2, ' ');
1890   ++depth;
1891   contents->append(" {\n");
1892 
1893   FormatLineOptions(depth, options(), contents);
1894 
1895   // Find all the 'group' types for fields and extensions; we will not output
1896   // their nested definitions (those will be done with their group field
1897   // descriptor).
1898   set<const Descriptor*> groups;
1899   for (int i = 0; i < field_count(); i++) {
1900     if (field(i)->type() == FieldDescriptor::TYPE_GROUP) {
1901       groups.insert(field(i)->message_type());
1902     }
1903   }
1904   for (int i = 0; i < extension_count(); i++) {
1905     if (extension(i)->type() == FieldDescriptor::TYPE_GROUP) {
1906       groups.insert(extension(i)->message_type());
1907     }
1908   }
1909 
1910   for (int i = 0; i < nested_type_count(); i++) {
1911     if (groups.count(nested_type(i)) == 0) {
1912       strings::SubstituteAndAppend(contents, "$0  message $1",
1913                                    prefix, nested_type(i)->name());
1914       nested_type(i)->DebugString(depth, contents);
1915     }
1916   }
1917   for (int i = 0; i < enum_type_count(); i++) {
1918     enum_type(i)->DebugString(depth, contents);
1919   }
1920   for (int i = 0; i < field_count(); i++) {
1921     if (field(i)->containing_oneof() == NULL) {
1922       field(i)->DebugString(depth, FieldDescriptor::PRINT_LABEL, contents);
1923     } else if (field(i)->containing_oneof()->field(0) == field(i)) {
1924       // This is the first field in this oneof, so print the whole oneof.
1925       field(i)->containing_oneof()->DebugString(depth, contents);
1926     }
1927   }
1928 
1929   for (int i = 0; i < extension_range_count(); i++) {
1930     strings::SubstituteAndAppend(contents, "$0  extensions $1 to $2;\n",
1931                                  prefix,
1932                                  extension_range(i)->start,
1933                                  extension_range(i)->end - 1);
1934   }
1935 
1936   // Group extensions by what they extend, so they can be printed out together.
1937   const Descriptor* containing_type = NULL;
1938   for (int i = 0; i < extension_count(); i++) {
1939     if (extension(i)->containing_type() != containing_type) {
1940       if (i > 0) strings::SubstituteAndAppend(contents, "$0  }\n", prefix);
1941       containing_type = extension(i)->containing_type();
1942       strings::SubstituteAndAppend(contents, "$0  extend .$1 {\n",
1943                                    prefix, containing_type->full_name());
1944     }
1945     extension(i)->DebugString(
1946         depth + 1, FieldDescriptor::PRINT_LABEL, contents);
1947   }
1948   if (extension_count() > 0)
1949     strings::SubstituteAndAppend(contents, "$0  }\n", prefix);
1950 
1951   strings::SubstituteAndAppend(contents, "$0}\n", prefix);
1952 }
1953 
DebugString() const1954 string FieldDescriptor::DebugString() const {
1955   string contents;
1956   int depth = 0;
1957   if (is_extension()) {
1958     strings::SubstituteAndAppend(&contents, "extend .$0 {\n",
1959                                  containing_type()->full_name());
1960     depth = 1;
1961   }
1962   DebugString(depth, PRINT_LABEL, &contents);
1963   if (is_extension()) {
1964     contents.append("}\n");
1965   }
1966   return contents;
1967 }
1968 
DebugString(int depth,PrintLabelFlag print_label_flag,string * contents) const1969 void FieldDescriptor::DebugString(int depth,
1970                                   PrintLabelFlag print_label_flag,
1971                                   string *contents) const {
1972   string prefix(depth * 2, ' ');
1973   string field_type;
1974   switch (type()) {
1975     case TYPE_MESSAGE:
1976       field_type = "." + message_type()->full_name();
1977       break;
1978     case TYPE_ENUM:
1979       field_type = "." + enum_type()->full_name();
1980       break;
1981     default:
1982       field_type = kTypeToName[type()];
1983   }
1984 
1985   string label;
1986   if (print_label_flag == PRINT_LABEL) {
1987     label = kLabelToName[this->label()];
1988     label.push_back(' ');
1989   }
1990 
1991   strings::SubstituteAndAppend(contents, "$0$1$2 $3 = $4",
1992                                prefix,
1993                                label,
1994                                field_type,
1995                                type() == TYPE_GROUP ? message_type()->name() :
1996                                                       name(),
1997                                number());
1998 
1999   bool bracketed = false;
2000   if (has_default_value()) {
2001     bracketed = true;
2002     strings::SubstituteAndAppend(contents, " [default = $0",
2003                                  DefaultValueAsString(true));
2004   }
2005 
2006   string formatted_options;
2007   if (FormatBracketedOptions(depth, options(), &formatted_options)) {
2008     contents->append(bracketed ? ", " : " [");
2009     bracketed = true;
2010     contents->append(formatted_options);
2011   }
2012 
2013   if (bracketed) {
2014     contents->append("]");
2015   }
2016 
2017   if (type() == TYPE_GROUP) {
2018     message_type()->DebugString(depth, contents);
2019   } else {
2020     contents->append(";\n");
2021   }
2022 }
2023 
DebugString() const2024 string OneofDescriptor::DebugString() const {
2025   string contents;
2026   DebugString(0, &contents);
2027   return contents;
2028 }
2029 
DebugString(int depth,string * contents) const2030 void OneofDescriptor::DebugString(int depth, string* contents) const {
2031   string prefix(depth * 2, ' ');
2032   ++depth;
2033   strings::SubstituteAndAppend(
2034       contents, "$0 oneof $1 {\n", prefix, name());
2035   for (int i = 0; i < field_count(); i++) {
2036     field(i)->DebugString(depth, FieldDescriptor::OMIT_LABEL, contents);
2037   }
2038   strings::SubstituteAndAppend(contents, "$0}\n", prefix);
2039 }
2040 
DebugString() const2041 string EnumDescriptor::DebugString() const {
2042   string contents;
2043   DebugString(0, &contents);
2044   return contents;
2045 }
2046 
DebugString(int depth,string * contents) const2047 void EnumDescriptor::DebugString(int depth, string *contents) const {
2048   string prefix(depth * 2, ' ');
2049   ++depth;
2050   strings::SubstituteAndAppend(contents, "$0enum $1 {\n",
2051                                prefix, name());
2052 
2053   FormatLineOptions(depth, options(), contents);
2054 
2055   for (int i = 0; i < value_count(); i++) {
2056     value(i)->DebugString(depth, contents);
2057   }
2058   strings::SubstituteAndAppend(contents, "$0}\n", prefix);
2059 }
2060 
DebugString() const2061 string EnumValueDescriptor::DebugString() const {
2062   string contents;
2063   DebugString(0, &contents);
2064   return contents;
2065 }
2066 
DebugString(int depth,string * contents) const2067 void EnumValueDescriptor::DebugString(int depth, string *contents) const {
2068   string prefix(depth * 2, ' ');
2069   strings::SubstituteAndAppend(contents, "$0$1 = $2",
2070                                prefix, name(), number());
2071 
2072   string formatted_options;
2073   if (FormatBracketedOptions(depth, options(), &formatted_options)) {
2074     strings::SubstituteAndAppend(contents, " [$0]", formatted_options);
2075   }
2076   contents->append(";\n");
2077 }
2078 
DebugString() const2079 string ServiceDescriptor::DebugString() const {
2080   string contents;
2081   DebugString(&contents);
2082   return contents;
2083 }
2084 
DebugString(string * contents) const2085 void ServiceDescriptor::DebugString(string *contents) const {
2086   strings::SubstituteAndAppend(contents, "service $0 {\n", name());
2087 
2088   FormatLineOptions(1, options(), contents);
2089 
2090   for (int i = 0; i < method_count(); i++) {
2091     method(i)->DebugString(1, contents);
2092   }
2093 
2094   contents->append("}\n");
2095 }
2096 
DebugString() const2097 string MethodDescriptor::DebugString() const {
2098   string contents;
2099   DebugString(0, &contents);
2100   return contents;
2101 }
2102 
DebugString(int depth,string * contents) const2103 void MethodDescriptor::DebugString(int depth, string *contents) const {
2104   string prefix(depth * 2, ' ');
2105   ++depth;
2106   strings::SubstituteAndAppend(contents, "$0rpc $1(.$2) returns (.$3)",
2107                                prefix, name(),
2108                                input_type()->full_name(),
2109                                output_type()->full_name());
2110 
2111   string formatted_options;
2112   if (FormatLineOptions(depth, options(), &formatted_options)) {
2113     strings::SubstituteAndAppend(contents, " {\n$0$1}\n",
2114                                  formatted_options, prefix);
2115   } else {
2116     contents->append(";\n");
2117   }
2118 }
2119 
2120 
2121 // Location methods ===============================================
2122 
GetSourceLocation(const vector<int> & path,SourceLocation * out_location) const2123 bool FileDescriptor::GetSourceLocation(const vector<int>& path,
2124                                        SourceLocation* out_location) const {
2125   GOOGLE_CHECK_NOTNULL(out_location);
2126   if (source_code_info_) {
2127     if (const SourceCodeInfo_Location* loc =
2128         tables_->GetSourceLocation(path, source_code_info_)) {
2129       const RepeatedField<int32>& span = loc->span();
2130       if (span.size() == 3 || span.size() == 4) {
2131         out_location->start_line   = span.Get(0);
2132         out_location->start_column = span.Get(1);
2133         out_location->end_line     = span.Get(span.size() == 3 ? 0 : 2);
2134         out_location->end_column   = span.Get(span.size() - 1);
2135 
2136         out_location->leading_comments = loc->leading_comments();
2137         out_location->trailing_comments = loc->trailing_comments();
2138         return true;
2139       }
2140     }
2141   }
2142   return false;
2143 }
2144 
is_packed() const2145 bool FieldDescriptor::is_packed() const {
2146   return is_packable() && (options_ != NULL) && options_->packed();
2147 }
2148 
GetSourceLocation(SourceLocation * out_location) const2149 bool Descriptor::GetSourceLocation(SourceLocation* out_location) const {
2150   vector<int> path;
2151   GetLocationPath(&path);
2152   return file()->GetSourceLocation(path, out_location);
2153 }
2154 
GetSourceLocation(SourceLocation * out_location) const2155 bool FieldDescriptor::GetSourceLocation(SourceLocation* out_location) const {
2156   vector<int> path;
2157   GetLocationPath(&path);
2158   return file()->GetSourceLocation(path, out_location);
2159 }
2160 
GetSourceLocation(SourceLocation * out_location) const2161 bool OneofDescriptor::GetSourceLocation(SourceLocation* out_location) const {
2162   vector<int> path;
2163   GetLocationPath(&path);
2164   return containing_type()->file()->GetSourceLocation(path, out_location);
2165 }
2166 
GetSourceLocation(SourceLocation * out_location) const2167 bool EnumDescriptor::GetSourceLocation(SourceLocation* out_location) const {
2168   vector<int> path;
2169   GetLocationPath(&path);
2170   return file()->GetSourceLocation(path, out_location);
2171 }
2172 
GetSourceLocation(SourceLocation * out_location) const2173 bool MethodDescriptor::GetSourceLocation(SourceLocation* out_location) const {
2174   vector<int> path;
2175   GetLocationPath(&path);
2176   return service()->file()->GetSourceLocation(path, out_location);
2177 }
2178 
GetSourceLocation(SourceLocation * out_location) const2179 bool ServiceDescriptor::GetSourceLocation(SourceLocation* out_location) const {
2180   vector<int> path;
2181   GetLocationPath(&path);
2182   return file()->GetSourceLocation(path, out_location);
2183 }
2184 
GetSourceLocation(SourceLocation * out_location) const2185 bool EnumValueDescriptor::GetSourceLocation(
2186     SourceLocation* out_location) const {
2187   vector<int> path;
2188   GetLocationPath(&path);
2189   return type()->file()->GetSourceLocation(path, out_location);
2190 }
2191 
GetLocationPath(vector<int> * output) const2192 void Descriptor::GetLocationPath(vector<int>* output) const {
2193   if (containing_type()) {
2194     containing_type()->GetLocationPath(output);
2195     output->push_back(DescriptorProto::kNestedTypeFieldNumber);
2196     output->push_back(index());
2197   } else {
2198     output->push_back(FileDescriptorProto::kMessageTypeFieldNumber);
2199     output->push_back(index());
2200   }
2201 }
2202 
GetLocationPath(vector<int> * output) const2203 void FieldDescriptor::GetLocationPath(vector<int>* output) const {
2204   if (is_extension()) {
2205     if (extension_scope() == NULL) {
2206       output->push_back(FileDescriptorProto::kExtensionFieldNumber);
2207       output->push_back(index());
2208     } else {
2209       extension_scope()->GetLocationPath(output);
2210       output->push_back(DescriptorProto::kExtensionFieldNumber);
2211       output->push_back(index());
2212     }
2213   } else {
2214     containing_type()->GetLocationPath(output);
2215     output->push_back(DescriptorProto::kFieldFieldNumber);
2216     output->push_back(index());
2217   }
2218 }
2219 
GetLocationPath(vector<int> * output) const2220 void OneofDescriptor::GetLocationPath(vector<int>* output) const {
2221   containing_type()->GetLocationPath(output);
2222   output->push_back(DescriptorProto::kOneofDeclFieldNumber);
2223   output->push_back(index());
2224 }
2225 
GetLocationPath(vector<int> * output) const2226 void EnumDescriptor::GetLocationPath(vector<int>* output) const {
2227   if (containing_type()) {
2228     containing_type()->GetLocationPath(output);
2229     output->push_back(DescriptorProto::kEnumTypeFieldNumber);
2230     output->push_back(index());
2231   } else {
2232     output->push_back(FileDescriptorProto::kEnumTypeFieldNumber);
2233     output->push_back(index());
2234   }
2235 }
2236 
GetLocationPath(vector<int> * output) const2237 void EnumValueDescriptor::GetLocationPath(vector<int>* output) const {
2238   type()->GetLocationPath(output);
2239   output->push_back(EnumDescriptorProto::kValueFieldNumber);
2240   output->push_back(index());
2241 }
2242 
GetLocationPath(vector<int> * output) const2243 void ServiceDescriptor::GetLocationPath(vector<int>* output) const {
2244   output->push_back(FileDescriptorProto::kServiceFieldNumber);
2245   output->push_back(index());
2246 }
2247 
GetLocationPath(vector<int> * output) const2248 void MethodDescriptor::GetLocationPath(vector<int>* output) const {
2249   service()->GetLocationPath(output);
2250   output->push_back(ServiceDescriptorProto::kMethodFieldNumber);
2251   output->push_back(index());
2252 }
2253 
2254 // ===================================================================
2255 
2256 namespace {
2257 
2258 // Represents an options message to interpret. Extension names in the option
2259 // name are respolved relative to name_scope. element_name and orig_opt are
2260 // used only for error reporting (since the parser records locations against
2261 // pointers in the original options, not the mutable copy). The Message must be
2262 // one of the Options messages in descriptor.proto.
2263 struct OptionsToInterpret {
OptionsToInterpretgoogle::protobuf::__anond0d5fb670511::OptionsToInterpret2264   OptionsToInterpret(const string& ns,
2265                      const string& el,
2266                      const Message* orig_opt,
2267                      Message* opt)
2268       : name_scope(ns),
2269         element_name(el),
2270         original_options(orig_opt),
2271         options(opt) {
2272   }
2273   string name_scope;
2274   string element_name;
2275   const Message* original_options;
2276   Message* options;
2277 };
2278 
2279 }  // namespace
2280 
2281 class DescriptorBuilder {
2282  public:
2283   DescriptorBuilder(const DescriptorPool* pool,
2284                     DescriptorPool::Tables* tables,
2285                     DescriptorPool::ErrorCollector* error_collector);
2286   ~DescriptorBuilder();
2287 
2288   const FileDescriptor* BuildFile(const FileDescriptorProto& proto);
2289 
2290  private:
2291   friend class OptionInterpreter;
2292 
2293   const DescriptorPool* pool_;
2294   DescriptorPool::Tables* tables_;  // for convenience
2295   DescriptorPool::ErrorCollector* error_collector_;
2296 
2297   // As we build descriptors we store copies of the options messages in
2298   // them. We put pointers to those copies in this vector, as we build, so we
2299   // can later (after cross-linking) interpret those options.
2300   vector<OptionsToInterpret> options_to_interpret_;
2301 
2302   bool had_errors_;
2303   string filename_;
2304   FileDescriptor* file_;
2305   FileDescriptorTables* file_tables_;
2306   set<const FileDescriptor*> dependencies_;
2307 
2308   // unused_dependency_ is used to record the unused imported files.
2309   // Note: public import is not considered.
2310   set<const FileDescriptor*> unused_dependency_;
2311 
2312   // If LookupSymbol() finds a symbol that is in a file which is not a declared
2313   // dependency of this file, it will fail, but will set
2314   // possible_undeclared_dependency_ to point at that file.  This is only used
2315   // by AddNotDefinedError() to report a more useful error message.
2316   // possible_undeclared_dependency_name_ is the name of the symbol that was
2317   // actually found in possible_undeclared_dependency_, which may be a parent
2318   // of the symbol actually looked for.
2319   const FileDescriptor* possible_undeclared_dependency_;
2320   string possible_undeclared_dependency_name_;
2321 
2322   // If LookupSymbol() could resolve a symbol which is not defined,
2323   // record the resolved name.  This is only used by AddNotDefinedError()
2324   // to report a more useful error message.
2325   string undefine_resolved_name_;
2326 
2327   void AddError(const string& element_name,
2328                 const Message& descriptor,
2329                 DescriptorPool::ErrorCollector::ErrorLocation location,
2330                 const string& error);
2331   void AddError(const string& element_name,
2332                 const Message& descriptor,
2333                 DescriptorPool::ErrorCollector::ErrorLocation location,
2334                 const char* error);
2335   void AddRecursiveImportError(const FileDescriptorProto& proto, int from_here);
2336   void AddTwiceListedError(const FileDescriptorProto& proto, int index);
2337   void AddImportError(const FileDescriptorProto& proto, int index);
2338 
2339   // Adds an error indicating that undefined_symbol was not defined.  Must
2340   // only be called after LookupSymbol() fails.
2341   void AddNotDefinedError(
2342     const string& element_name,
2343     const Message& descriptor,
2344     DescriptorPool::ErrorCollector::ErrorLocation location,
2345     const string& undefined_symbol);
2346 
2347   void AddWarning(const string& element_name, const Message& descriptor,
2348                   DescriptorPool::ErrorCollector::ErrorLocation location,
2349                   const string& error);
2350 
2351   // Silly helper which determines if the given file is in the given package.
2352   // I.e., either file->package() == package_name or file->package() is a
2353   // nested package within package_name.
2354   bool IsInPackage(const FileDescriptor* file, const string& package_name);
2355 
2356   // Helper function which finds all public dependencies of the given file, and
2357   // stores the them in the dependencies_ set in the builder.
2358   void RecordPublicDependencies(const FileDescriptor* file);
2359 
2360   // Like tables_->FindSymbol(), but additionally:
2361   // - Search the pool's underlay if not found in tables_.
2362   // - Insure that the resulting Symbol is from one of the file's declared
2363   //   dependencies.
2364   Symbol FindSymbol(const string& name);
2365 
2366   // Like FindSymbol() but does not require that the symbol is in one of the
2367   // file's declared dependencies.
2368   Symbol FindSymbolNotEnforcingDeps(const string& name);
2369 
2370   // This implements the body of FindSymbolNotEnforcingDeps().
2371   Symbol FindSymbolNotEnforcingDepsHelper(const DescriptorPool* pool,
2372                                           const string& name);
2373 
2374   // Like FindSymbol(), but looks up the name relative to some other symbol
2375   // name.  This first searches siblings of relative_to, then siblings of its
2376   // parents, etc.  For example, LookupSymbol("foo.bar", "baz.qux.corge") makes
2377   // the following calls, returning the first non-null result:
2378   // FindSymbol("baz.qux.foo.bar"), FindSymbol("baz.foo.bar"),
2379   // FindSymbol("foo.bar").  If AllowUnknownDependencies() has been called
2380   // on the DescriptorPool, this will generate a placeholder type if
2381   // the name is not found (unless the name itself is malformed).  The
2382   // placeholder_type parameter indicates what kind of placeholder should be
2383   // constructed in this case.  The resolve_mode parameter determines whether
2384   // any symbol is returned, or only symbols that are types.  Note, however,
2385   // that LookupSymbol may still return a non-type symbol in LOOKUP_TYPES mode,
2386   // if it believes that's all it could refer to.  The caller should always
2387   // check that it receives the type of symbol it was expecting.
2388   enum PlaceholderType {
2389     PLACEHOLDER_MESSAGE,
2390     PLACEHOLDER_ENUM,
2391     PLACEHOLDER_EXTENDABLE_MESSAGE
2392   };
2393   enum ResolveMode {
2394     LOOKUP_ALL, LOOKUP_TYPES
2395   };
2396   Symbol LookupSymbol(const string& name, const string& relative_to,
2397                       PlaceholderType placeholder_type = PLACEHOLDER_MESSAGE,
2398                       ResolveMode resolve_mode = LOOKUP_ALL);
2399 
2400   // Like LookupSymbol() but will not return a placeholder even if
2401   // AllowUnknownDependencies() has been used.
2402   Symbol LookupSymbolNoPlaceholder(const string& name,
2403                                    const string& relative_to,
2404                                    ResolveMode resolve_mode = LOOKUP_ALL);
2405 
2406   // Creates a placeholder type suitable for return from LookupSymbol().  May
2407   // return kNullSymbol if the name is not a valid type name.
2408   Symbol NewPlaceholder(const string& name, PlaceholderType placeholder_type);
2409 
2410   // Creates a placeholder file.  Never returns NULL.  This is used when an
2411   // import is not found and AllowUnknownDependencies() is enabled.
2412   const FileDescriptor* NewPlaceholderFile(const string& name);
2413 
2414   // Calls tables_->AddSymbol() and records an error if it fails.  Returns
2415   // true if successful or false if failed, though most callers can ignore
2416   // the return value since an error has already been recorded.
2417   bool AddSymbol(const string& full_name,
2418                  const void* parent, const string& name,
2419                  const Message& proto, Symbol symbol);
2420 
2421   // Like AddSymbol(), but succeeds if the symbol is already defined as long
2422   // as the existing definition is also a package (because it's OK to define
2423   // the same package in two different files).  Also adds all parents of the
2424   // packgae to the symbol table (e.g. AddPackage("foo.bar", ...) will add
2425   // "foo.bar" and "foo" to the table).
2426   void AddPackage(const string& name, const Message& proto,
2427                   const FileDescriptor* file);
2428 
2429   // Checks that the symbol name contains only alphanumeric characters and
2430   // underscores.  Records an error otherwise.
2431   void ValidateSymbolName(const string& name, const string& full_name,
2432                           const Message& proto);
2433 
2434   // Like ValidateSymbolName(), but the name is allowed to contain periods and
2435   // an error is indicated by returning false (not recording the error).
2436   bool ValidateQualifiedName(const string& name);
2437 
2438   // Used by BUILD_ARRAY macro (below) to avoid having to have the type
2439   // specified as a macro parameter.
2440   template <typename Type>
AllocateArray(int size,Type ** output)2441   inline void AllocateArray(int size, Type** output) {
2442     *output = tables_->AllocateArray<Type>(size);
2443   }
2444 
2445   // Allocates a copy of orig_options in tables_ and stores it in the
2446   // descriptor. Remembers its uninterpreted options, to be interpreted
2447   // later. DescriptorT must be one of the Descriptor messages from
2448   // descriptor.proto.
2449   template<class DescriptorT> void AllocateOptions(
2450       const typename DescriptorT::OptionsType& orig_options,
2451       DescriptorT* descriptor);
2452   // Specialization for FileOptions.
2453   void AllocateOptions(const FileOptions& orig_options,
2454                        FileDescriptor* descriptor);
2455 
2456   // Implementation for AllocateOptions(). Don't call this directly.
2457   template<class DescriptorT> void AllocateOptionsImpl(
2458       const string& name_scope,
2459       const string& element_name,
2460       const typename DescriptorT::OptionsType& orig_options,
2461       DescriptorT* descriptor);
2462 
2463   // These methods all have the same signature for the sake of the BUILD_ARRAY
2464   // macro, below.
2465   void BuildMessage(const DescriptorProto& proto,
2466                     const Descriptor* parent,
2467                     Descriptor* result);
2468   void BuildFieldOrExtension(const FieldDescriptorProto& proto,
2469                              const Descriptor* parent,
2470                              FieldDescriptor* result,
2471                              bool is_extension);
BuildField(const FieldDescriptorProto & proto,const Descriptor * parent,FieldDescriptor * result)2472   void BuildField(const FieldDescriptorProto& proto,
2473                   const Descriptor* parent,
2474                   FieldDescriptor* result) {
2475     BuildFieldOrExtension(proto, parent, result, false);
2476   }
BuildExtension(const FieldDescriptorProto & proto,const Descriptor * parent,FieldDescriptor * result)2477   void BuildExtension(const FieldDescriptorProto& proto,
2478                       const Descriptor* parent,
2479                       FieldDescriptor* result) {
2480     BuildFieldOrExtension(proto, parent, result, true);
2481   }
2482   void BuildExtensionRange(const DescriptorProto::ExtensionRange& proto,
2483                            const Descriptor* parent,
2484                            Descriptor::ExtensionRange* result);
2485   void BuildOneof(const OneofDescriptorProto& proto,
2486                   Descriptor* parent,
2487                   OneofDescriptor* result);
2488   void BuildEnum(const EnumDescriptorProto& proto,
2489                  const Descriptor* parent,
2490                  EnumDescriptor* result);
2491   void BuildEnumValue(const EnumValueDescriptorProto& proto,
2492                       const EnumDescriptor* parent,
2493                       EnumValueDescriptor* result);
2494   void BuildService(const ServiceDescriptorProto& proto,
2495                     const void* dummy,
2496                     ServiceDescriptor* result);
2497   void BuildMethod(const MethodDescriptorProto& proto,
2498                    const ServiceDescriptor* parent,
2499                    MethodDescriptor* result);
2500 
2501   void LogUnusedDependency(const FileDescriptor* result);
2502 
2503   // Must be run only after building.
2504   //
2505   // NOTE: Options will not be available during cross-linking, as they
2506   // have not yet been interpreted. Defer any handling of options to the
2507   // Validate*Options methods.
2508   void CrossLinkFile(FileDescriptor* file, const FileDescriptorProto& proto);
2509   void CrossLinkMessage(Descriptor* message, const DescriptorProto& proto);
2510   void CrossLinkField(FieldDescriptor* field,
2511                       const FieldDescriptorProto& proto);
2512   void CrossLinkEnum(EnumDescriptor* enum_type,
2513                      const EnumDescriptorProto& proto);
2514   void CrossLinkEnumValue(EnumValueDescriptor* enum_value,
2515                           const EnumValueDescriptorProto& proto);
2516   void CrossLinkService(ServiceDescriptor* service,
2517                         const ServiceDescriptorProto& proto);
2518   void CrossLinkMethod(MethodDescriptor* method,
2519                        const MethodDescriptorProto& proto);
2520 
2521   // Must be run only after cross-linking.
2522   void InterpretOptions();
2523 
2524   // A helper class for interpreting options.
2525   class OptionInterpreter {
2526    public:
2527     // Creates an interpreter that operates in the context of the pool of the
2528     // specified builder, which must not be NULL. We don't take ownership of the
2529     // builder.
2530     explicit OptionInterpreter(DescriptorBuilder* builder);
2531 
2532     ~OptionInterpreter();
2533 
2534     // Interprets the uninterpreted options in the specified Options message.
2535     // On error, calls AddError() on the underlying builder and returns false.
2536     // Otherwise returns true.
2537     bool InterpretOptions(OptionsToInterpret* options_to_interpret);
2538 
2539     class AggregateOptionFinder;
2540 
2541    private:
2542     // Interprets uninterpreted_option_ on the specified message, which
2543     // must be the mutable copy of the original options message to which
2544     // uninterpreted_option_ belongs.
2545     bool InterpretSingleOption(Message* options);
2546 
2547     // Adds the uninterpreted_option to the given options message verbatim.
2548     // Used when AllowUnknownDependencies() is in effect and we can't find
2549     // the option's definition.
2550     void AddWithoutInterpreting(const UninterpretedOption& uninterpreted_option,
2551                                 Message* options);
2552 
2553     // A recursive helper function that drills into the intermediate fields
2554     // in unknown_fields to check if field innermost_field is set on the
2555     // innermost message. Returns false and sets an error if so.
2556     bool ExamineIfOptionIsSet(
2557         vector<const FieldDescriptor*>::const_iterator intermediate_fields_iter,
2558         vector<const FieldDescriptor*>::const_iterator intermediate_fields_end,
2559         const FieldDescriptor* innermost_field, const string& debug_msg_name,
2560         const UnknownFieldSet& unknown_fields);
2561 
2562     // Validates the value for the option field of the currently interpreted
2563     // option and then sets it on the unknown_field.
2564     bool SetOptionValue(const FieldDescriptor* option_field,
2565                         UnknownFieldSet* unknown_fields);
2566 
2567     // Parses an aggregate value for a CPPTYPE_MESSAGE option and
2568     // saves it into *unknown_fields.
2569     bool SetAggregateOption(const FieldDescriptor* option_field,
2570                             UnknownFieldSet* unknown_fields);
2571 
2572     // Convenience functions to set an int field the right way, depending on
2573     // its wire type (a single int CppType can represent multiple wire types).
2574     void SetInt32(int number, int32 value, FieldDescriptor::Type type,
2575                   UnknownFieldSet* unknown_fields);
2576     void SetInt64(int number, int64 value, FieldDescriptor::Type type,
2577                   UnknownFieldSet* unknown_fields);
2578     void SetUInt32(int number, uint32 value, FieldDescriptor::Type type,
2579                    UnknownFieldSet* unknown_fields);
2580     void SetUInt64(int number, uint64 value, FieldDescriptor::Type type,
2581                    UnknownFieldSet* unknown_fields);
2582 
2583     // A helper function that adds an error at the specified location of the
2584     // option we're currently interpreting, and returns false.
AddOptionError(DescriptorPool::ErrorCollector::ErrorLocation location,const string & msg)2585     bool AddOptionError(DescriptorPool::ErrorCollector::ErrorLocation location,
2586                         const string& msg) {
2587       builder_->AddError(options_to_interpret_->element_name,
2588                          *uninterpreted_option_, location, msg);
2589       return false;
2590     }
2591 
2592     // A helper function that adds an error at the location of the option name
2593     // and returns false.
AddNameError(const string & msg)2594     bool AddNameError(const string& msg) {
2595       return AddOptionError(DescriptorPool::ErrorCollector::OPTION_NAME, msg);
2596     }
2597 
2598     // A helper function that adds an error at the location of the option name
2599     // and returns false.
AddValueError(const string & msg)2600     bool AddValueError(const string& msg) {
2601       return AddOptionError(DescriptorPool::ErrorCollector::OPTION_VALUE, msg);
2602     }
2603 
2604     // We interpret against this builder's pool. Is never NULL. We don't own
2605     // this pointer.
2606     DescriptorBuilder* builder_;
2607 
2608     // The options we're currently interpreting, or NULL if we're not in a call
2609     // to InterpretOptions.
2610     const OptionsToInterpret* options_to_interpret_;
2611 
2612     // The option we're currently interpreting within options_to_interpret_, or
2613     // NULL if we're not in a call to InterpretOptions(). This points to a
2614     // submessage of the original option, not the mutable copy. Therefore we
2615     // can use it to find locations recorded by the parser.
2616     const UninterpretedOption* uninterpreted_option_;
2617 
2618     // Factory used to create the dynamic messages we need to parse
2619     // any aggregate option values we encounter.
2620     DynamicMessageFactory dynamic_factory_;
2621 
2622     GOOGLE_DISALLOW_EVIL_CONSTRUCTORS(OptionInterpreter);
2623   };
2624 
2625   // Work-around for broken compilers:  According to the C++ standard,
2626   // OptionInterpreter should have access to the private members of any class
2627   // which has declared DescriptorBuilder as a friend.  Unfortunately some old
2628   // versions of GCC and other compilers do not implement this correctly.  So,
2629   // we have to have these intermediate methods to provide access.  We also
2630   // redundantly declare OptionInterpreter a friend just to make things extra
2631   // clear for these bad compilers.
2632   friend class OptionInterpreter;
2633   friend class OptionInterpreter::AggregateOptionFinder;
2634 
get_allow_unknown(const DescriptorPool * pool)2635   static inline bool get_allow_unknown(const DescriptorPool* pool) {
2636     return pool->allow_unknown_;
2637   }
get_enforce_weak(const DescriptorPool * pool)2638   static inline bool get_enforce_weak(const DescriptorPool* pool) {
2639     return pool->enforce_weak_;
2640   }
get_is_placeholder(const Descriptor * descriptor)2641   static inline bool get_is_placeholder(const Descriptor* descriptor) {
2642     return descriptor->is_placeholder_;
2643   }
assert_mutex_held(const DescriptorPool * pool)2644   static inline void assert_mutex_held(const DescriptorPool* pool) {
2645     if (pool->mutex_ != NULL) {
2646       pool->mutex_->AssertHeld();
2647     }
2648   }
2649 
2650   // Must be run only after options have been interpreted.
2651   //
2652   // NOTE: Validation code must only reference the options in the mutable
2653   // descriptors, which are the ones that have been interpreted. The const
2654   // proto references are passed in only so they can be provided to calls to
2655   // AddError(). Do not look at their options, which have not been interpreted.
2656   void ValidateFileOptions(FileDescriptor* file,
2657                            const FileDescriptorProto& proto);
2658   void ValidateMessageOptions(Descriptor* message,
2659                               const DescriptorProto& proto);
2660   void ValidateFieldOptions(FieldDescriptor* field,
2661                             const FieldDescriptorProto& proto);
2662   void ValidateEnumOptions(EnumDescriptor* enm,
2663                            const EnumDescriptorProto& proto);
2664   void ValidateEnumValueOptions(EnumValueDescriptor* enum_value,
2665                                 const EnumValueDescriptorProto& proto);
2666   void ValidateServiceOptions(ServiceDescriptor* service,
2667                               const ServiceDescriptorProto& proto);
2668   void ValidateMethodOptions(MethodDescriptor* method,
2669                              const MethodDescriptorProto& proto);
2670 
2671   void ValidateMapKey(FieldDescriptor* field,
2672                       const FieldDescriptorProto& proto);
2673 
2674 };
2675 
BuildFile(const FileDescriptorProto & proto)2676 const FileDescriptor* DescriptorPool::BuildFile(
2677     const FileDescriptorProto& proto) {
2678   GOOGLE_CHECK(fallback_database_ == NULL)
2679     << "Cannot call BuildFile on a DescriptorPool that uses a "
2680        "DescriptorDatabase.  You must instead find a way to get your file "
2681        "into the underlying database.";
2682   GOOGLE_CHECK(mutex_ == NULL);   // Implied by the above GOOGLE_CHECK.
2683   tables_->known_bad_symbols_.clear();
2684   tables_->known_bad_files_.clear();
2685   return DescriptorBuilder(this, tables_.get(), NULL).BuildFile(proto);
2686 }
2687 
BuildFileCollectingErrors(const FileDescriptorProto & proto,ErrorCollector * error_collector)2688 const FileDescriptor* DescriptorPool::BuildFileCollectingErrors(
2689     const FileDescriptorProto& proto,
2690     ErrorCollector* error_collector) {
2691   GOOGLE_CHECK(fallback_database_ == NULL)
2692     << "Cannot call BuildFile on a DescriptorPool that uses a "
2693        "DescriptorDatabase.  You must instead find a way to get your file "
2694        "into the underlying database.";
2695   GOOGLE_CHECK(mutex_ == NULL);   // Implied by the above GOOGLE_CHECK.
2696   tables_->known_bad_symbols_.clear();
2697   tables_->known_bad_files_.clear();
2698   return DescriptorBuilder(this, tables_.get(),
2699                            error_collector).BuildFile(proto);
2700 }
2701 
BuildFileFromDatabase(const FileDescriptorProto & proto) const2702 const FileDescriptor* DescriptorPool::BuildFileFromDatabase(
2703     const FileDescriptorProto& proto) const {
2704   mutex_->AssertHeld();
2705   if (tables_->known_bad_files_.count(proto.name()) > 0) {
2706     return NULL;
2707   }
2708   const FileDescriptor* result =
2709       DescriptorBuilder(this, tables_.get(),
2710                         default_error_collector_).BuildFile(proto);
2711   if (result == NULL) {
2712     tables_->known_bad_files_.insert(proto.name());
2713   }
2714   return result;
2715 }
2716 
DescriptorBuilder(const DescriptorPool * pool,DescriptorPool::Tables * tables,DescriptorPool::ErrorCollector * error_collector)2717 DescriptorBuilder::DescriptorBuilder(
2718     const DescriptorPool* pool,
2719     DescriptorPool::Tables* tables,
2720     DescriptorPool::ErrorCollector* error_collector)
2721   : pool_(pool),
2722     tables_(tables),
2723     error_collector_(error_collector),
2724     had_errors_(false),
2725     possible_undeclared_dependency_(NULL),
2726     undefine_resolved_name_("") {}
2727 
~DescriptorBuilder()2728 DescriptorBuilder::~DescriptorBuilder() {}
2729 
AddError(const string & element_name,const Message & descriptor,DescriptorPool::ErrorCollector::ErrorLocation location,const string & error)2730 void DescriptorBuilder::AddError(
2731     const string& element_name,
2732     const Message& descriptor,
2733     DescriptorPool::ErrorCollector::ErrorLocation location,
2734     const string& error) {
2735   if (error_collector_ == NULL) {
2736     if (!had_errors_) {
2737       GOOGLE_LOG(ERROR) << "Invalid proto descriptor for file \"" << filename_
2738                  << "\":";
2739     }
2740     GOOGLE_LOG(ERROR) << "  " << element_name << ": " << error;
2741   } else {
2742     error_collector_->AddError(filename_, element_name,
2743                                &descriptor, location, error);
2744   }
2745   had_errors_ = true;
2746 }
2747 
AddError(const string & element_name,const Message & descriptor,DescriptorPool::ErrorCollector::ErrorLocation location,const char * error)2748 void DescriptorBuilder::AddError(
2749     const string& element_name,
2750     const Message& descriptor,
2751     DescriptorPool::ErrorCollector::ErrorLocation location,
2752     const char* error) {
2753   AddError(element_name, descriptor, location, string(error));
2754 }
2755 
AddNotDefinedError(const string & element_name,const Message & descriptor,DescriptorPool::ErrorCollector::ErrorLocation location,const string & undefined_symbol)2756 void DescriptorBuilder::AddNotDefinedError(
2757     const string& element_name,
2758     const Message& descriptor,
2759     DescriptorPool::ErrorCollector::ErrorLocation location,
2760     const string& undefined_symbol) {
2761   if (possible_undeclared_dependency_ == NULL &&
2762       undefine_resolved_name_.empty()) {
2763     AddError(element_name, descriptor, location,
2764              "\"" + undefined_symbol + "\" is not defined.");
2765   } else {
2766     if (possible_undeclared_dependency_ != NULL) {
2767       AddError(element_name, descriptor, location,
2768                "\"" + possible_undeclared_dependency_name_ +
2769                "\" seems to be defined in \"" +
2770                possible_undeclared_dependency_->name() + "\", which is not "
2771                "imported by \"" + filename_ + "\".  To use it here, please "
2772                "add the necessary import.");
2773     }
2774     if (!undefine_resolved_name_.empty()) {
2775       AddError(element_name, descriptor, location,
2776                "\"" + undefined_symbol + "\" is resolved to \"" +
2777                undefine_resolved_name_ + "\", which is not defined. "
2778                "The innermost scope is searched first in name resolution. "
2779                "Consider using a leading '.'(i.e., \"."
2780                + undefined_symbol +
2781                "\") to start from the outermost scope.");
2782     }
2783   }
2784 }
2785 
AddWarning(const string & element_name,const Message & descriptor,DescriptorPool::ErrorCollector::ErrorLocation location,const string & error)2786 void DescriptorBuilder::AddWarning(
2787     const string& element_name, const Message& descriptor,
2788     DescriptorPool::ErrorCollector::ErrorLocation location,
2789     const string& error) {
2790   if (error_collector_ == NULL) {
2791     GOOGLE_LOG(WARNING) << filename_ << " " << element_name << ": " << error;
2792   } else {
2793     error_collector_->AddWarning(filename_, element_name, &descriptor, location,
2794                                  error);
2795   }
2796 }
2797 
IsInPackage(const FileDescriptor * file,const string & package_name)2798 bool DescriptorBuilder::IsInPackage(const FileDescriptor* file,
2799                                     const string& package_name) {
2800   return HasPrefixString(file->package(), package_name) &&
2801            (file->package().size() == package_name.size() ||
2802             file->package()[package_name.size()] == '.');
2803 }
2804 
RecordPublicDependencies(const FileDescriptor * file)2805 void DescriptorBuilder::RecordPublicDependencies(const FileDescriptor* file) {
2806   if (file == NULL || !dependencies_.insert(file).second) return;
2807   for (int i = 0; file != NULL && i < file->public_dependency_count(); i++) {
2808     RecordPublicDependencies(file->public_dependency(i));
2809   }
2810 }
2811 
FindSymbolNotEnforcingDepsHelper(const DescriptorPool * pool,const string & name)2812 Symbol DescriptorBuilder::FindSymbolNotEnforcingDepsHelper(
2813     const DescriptorPool* pool, const string& name) {
2814   // If we are looking at an underlay, we must lock its mutex_, since we are
2815   // accessing the underlay's tables_ directly.
2816   MutexLockMaybe lock((pool == pool_) ? NULL : pool->mutex_);
2817 
2818   Symbol result = pool->tables_->FindSymbol(name);
2819   if (result.IsNull() && pool->underlay_ != NULL) {
2820     // Symbol not found; check the underlay.
2821     result = FindSymbolNotEnforcingDepsHelper(pool->underlay_, name);
2822   }
2823 
2824   if (result.IsNull()) {
2825     // In theory, we shouldn't need to check fallback_database_ because the
2826     // symbol should be in one of its file's direct dependencies, and we have
2827     // already loaded those by the time we get here.  But we check anyway so
2828     // that we can generate better error message when dependencies are missing
2829     // (i.e., "missing dependency" rather than "type is not defined").
2830     if (pool->TryFindSymbolInFallbackDatabase(name)) {
2831       result = pool->tables_->FindSymbol(name);
2832     }
2833   }
2834 
2835   return result;
2836 }
2837 
FindSymbolNotEnforcingDeps(const string & name)2838 Symbol DescriptorBuilder::FindSymbolNotEnforcingDeps(const string& name) {
2839   return FindSymbolNotEnforcingDepsHelper(pool_, name);
2840 }
2841 
FindSymbol(const string & name)2842 Symbol DescriptorBuilder::FindSymbol(const string& name) {
2843   Symbol result = FindSymbolNotEnforcingDeps(name);
2844 
2845   if (result.IsNull()) return result;
2846 
2847   if (!pool_->enforce_dependencies_) {
2848     // Hack for CompilerUpgrader.
2849     return result;
2850   }
2851 
2852   // Only find symbols which were defined in this file or one of its
2853   // dependencies.
2854   const FileDescriptor* file = result.GetFile();
2855   if (file == file_ || dependencies_.count(file) > 0) {
2856     unused_dependency_.erase(file);
2857     return result;
2858   }
2859 
2860   if (result.type == Symbol::PACKAGE) {
2861     // Arg, this is overcomplicated.  The symbol is a package name.  It could
2862     // be that the package was defined in multiple files.  result.GetFile()
2863     // returns the first file we saw that used this package.  We've determined
2864     // that that file is not a direct dependency of the file we are currently
2865     // building, but it could be that some other file which *is* a direct
2866     // dependency also defines the same package.  We can't really rule out this
2867     // symbol unless none of the dependencies define it.
2868     if (IsInPackage(file_, name)) return result;
2869     for (set<const FileDescriptor*>::const_iterator it = dependencies_.begin();
2870          it != dependencies_.end(); ++it) {
2871       // Note:  A dependency may be NULL if it was not found or had errors.
2872       if (*it != NULL && IsInPackage(*it, name)) return result;
2873     }
2874   }
2875 
2876   possible_undeclared_dependency_ = file;
2877   possible_undeclared_dependency_name_ = name;
2878   return kNullSymbol;
2879 }
2880 
LookupSymbolNoPlaceholder(const string & name,const string & relative_to,ResolveMode resolve_mode)2881 Symbol DescriptorBuilder::LookupSymbolNoPlaceholder(
2882     const string& name, const string& relative_to, ResolveMode resolve_mode) {
2883   possible_undeclared_dependency_ = NULL;
2884   undefine_resolved_name_.clear();
2885 
2886   if (name.size() > 0 && name[0] == '.') {
2887     // Fully-qualified name.
2888     return FindSymbol(name.substr(1));
2889   }
2890 
2891   // If name is something like "Foo.Bar.baz", and symbols named "Foo" are
2892   // defined in multiple parent scopes, we only want to find "Bar.baz" in the
2893   // innermost one.  E.g., the following should produce an error:
2894   //   message Bar { message Baz {} }
2895   //   message Foo {
2896   //     message Bar {
2897   //     }
2898   //     optional Bar.Baz baz = 1;
2899   //   }
2900   // So, we look for just "Foo" first, then look for "Bar.baz" within it if
2901   // found.
2902   string::size_type name_dot_pos = name.find_first_of('.');
2903   string first_part_of_name;
2904   if (name_dot_pos == string::npos) {
2905     first_part_of_name = name;
2906   } else {
2907     first_part_of_name = name.substr(0, name_dot_pos);
2908   }
2909 
2910   string scope_to_try(relative_to);
2911 
2912   while (true) {
2913     // Chop off the last component of the scope.
2914     string::size_type dot_pos = scope_to_try.find_last_of('.');
2915     if (dot_pos == string::npos) {
2916       return FindSymbol(name);
2917     } else {
2918       scope_to_try.erase(dot_pos);
2919     }
2920 
2921     // Append ".first_part_of_name" and try to find.
2922     string::size_type old_size = scope_to_try.size();
2923     scope_to_try.append(1, '.');
2924     scope_to_try.append(first_part_of_name);
2925     Symbol result = FindSymbol(scope_to_try);
2926     if (!result.IsNull()) {
2927       if (first_part_of_name.size() < name.size()) {
2928         // name is a compound symbol, of which we only found the first part.
2929         // Now try to look up the rest of it.
2930         if (result.IsAggregate()) {
2931           scope_to_try.append(name, first_part_of_name.size(),
2932                               name.size() - first_part_of_name.size());
2933           result = FindSymbol(scope_to_try);
2934           if (result.IsNull()) {
2935             undefine_resolved_name_ = scope_to_try;
2936           }
2937           return result;
2938         } else {
2939           // We found a symbol but it's not an aggregate.  Continue the loop.
2940         }
2941       } else {
2942         if (resolve_mode == LOOKUP_TYPES && !result.IsType()) {
2943           // We found a symbol but it's not a type.  Continue the loop.
2944         } else {
2945           return result;
2946         }
2947       }
2948     }
2949 
2950     // Not found.  Remove the name so we can try again.
2951     scope_to_try.erase(old_size);
2952   }
2953 }
2954 
LookupSymbol(const string & name,const string & relative_to,PlaceholderType placeholder_type,ResolveMode resolve_mode)2955 Symbol DescriptorBuilder::LookupSymbol(
2956     const string& name, const string& relative_to,
2957     PlaceholderType placeholder_type, ResolveMode resolve_mode) {
2958   Symbol result = LookupSymbolNoPlaceholder(
2959       name, relative_to, resolve_mode);
2960   if (result.IsNull() && pool_->allow_unknown_) {
2961     // Not found, but AllowUnknownDependencies() is enabled.  Return a
2962     // placeholder instead.
2963     result = NewPlaceholder(name, placeholder_type);
2964   }
2965   return result;
2966 }
2967 
NewPlaceholder(const string & name,PlaceholderType placeholder_type)2968 Symbol DescriptorBuilder::NewPlaceholder(const string& name,
2969                                          PlaceholderType placeholder_type) {
2970   // Compute names.
2971   const string* placeholder_full_name;
2972   const string* placeholder_name;
2973   const string* placeholder_package;
2974 
2975   if (!ValidateQualifiedName(name)) return kNullSymbol;
2976   if (name[0] == '.') {
2977     // Fully-qualified.
2978     placeholder_full_name = tables_->AllocateString(name.substr(1));
2979   } else {
2980     placeholder_full_name = tables_->AllocateString(name);
2981   }
2982 
2983   string::size_type dotpos = placeholder_full_name->find_last_of('.');
2984   if (dotpos != string::npos) {
2985     placeholder_package = tables_->AllocateString(
2986       placeholder_full_name->substr(0, dotpos));
2987     placeholder_name = tables_->AllocateString(
2988       placeholder_full_name->substr(dotpos + 1));
2989   } else {
2990     placeholder_package = &internal::GetEmptyString();
2991     placeholder_name = placeholder_full_name;
2992   }
2993 
2994   // Create the placeholders.
2995   FileDescriptor* placeholder_file = tables_->Allocate<FileDescriptor>();
2996   memset(placeholder_file, 0, sizeof(*placeholder_file));
2997 
2998   placeholder_file->source_code_info_ = &SourceCodeInfo::default_instance();
2999 
3000   placeholder_file->name_ =
3001     tables_->AllocateString(*placeholder_full_name + ".placeholder.proto");
3002   placeholder_file->package_ = placeholder_package;
3003   placeholder_file->pool_ = pool_;
3004   placeholder_file->options_ = &FileOptions::default_instance();
3005   placeholder_file->tables_ = &FileDescriptorTables::kEmpty;
3006   placeholder_file->is_placeholder_ = true;
3007   // All other fields are zero or NULL.
3008 
3009   if (placeholder_type == PLACEHOLDER_ENUM) {
3010     placeholder_file->enum_type_count_ = 1;
3011     placeholder_file->enum_types_ =
3012       tables_->AllocateArray<EnumDescriptor>(1);
3013 
3014     EnumDescriptor* placeholder_enum = &placeholder_file->enum_types_[0];
3015     memset(placeholder_enum, 0, sizeof(*placeholder_enum));
3016 
3017     placeholder_enum->full_name_ = placeholder_full_name;
3018     placeholder_enum->name_ = placeholder_name;
3019     placeholder_enum->file_ = placeholder_file;
3020     placeholder_enum->options_ = &EnumOptions::default_instance();
3021     placeholder_enum->is_placeholder_ = true;
3022     placeholder_enum->is_unqualified_placeholder_ = (name[0] != '.');
3023 
3024     // Enums must have at least one value.
3025     placeholder_enum->value_count_ = 1;
3026     placeholder_enum->values_ = tables_->AllocateArray<EnumValueDescriptor>(1);
3027 
3028     EnumValueDescriptor* placeholder_value = &placeholder_enum->values_[0];
3029     memset(placeholder_value, 0, sizeof(*placeholder_value));
3030 
3031     placeholder_value->name_ = tables_->AllocateString("PLACEHOLDER_VALUE");
3032     // Note that enum value names are siblings of their type, not children.
3033     placeholder_value->full_name_ =
3034       placeholder_package->empty() ? placeholder_value->name_ :
3035         tables_->AllocateString(*placeholder_package + ".PLACEHOLDER_VALUE");
3036 
3037     placeholder_value->number_ = 0;
3038     placeholder_value->type_ = placeholder_enum;
3039     placeholder_value->options_ = &EnumValueOptions::default_instance();
3040 
3041     return Symbol(placeholder_enum);
3042   } else {
3043     placeholder_file->message_type_count_ = 1;
3044     placeholder_file->message_types_ =
3045       tables_->AllocateArray<Descriptor>(1);
3046 
3047     Descriptor* placeholder_message = &placeholder_file->message_types_[0];
3048     memset(placeholder_message, 0, sizeof(*placeholder_message));
3049 
3050     placeholder_message->full_name_ = placeholder_full_name;
3051     placeholder_message->name_ = placeholder_name;
3052     placeholder_message->file_ = placeholder_file;
3053     placeholder_message->options_ = &MessageOptions::default_instance();
3054     placeholder_message->is_placeholder_ = true;
3055     placeholder_message->is_unqualified_placeholder_ = (name[0] != '.');
3056 
3057     if (placeholder_type == PLACEHOLDER_EXTENDABLE_MESSAGE) {
3058       placeholder_message->extension_range_count_ = 1;
3059       placeholder_message->extension_ranges_ =
3060         tables_->AllocateArray<Descriptor::ExtensionRange>(1);
3061       placeholder_message->extension_ranges_->start = 1;
3062       // kMaxNumber + 1 because ExtensionRange::end is exclusive.
3063       placeholder_message->extension_ranges_->end =
3064         FieldDescriptor::kMaxNumber + 1;
3065     }
3066 
3067     return Symbol(placeholder_message);
3068   }
3069 }
3070 
NewPlaceholderFile(const string & name)3071 const FileDescriptor* DescriptorBuilder::NewPlaceholderFile(
3072     const string& name) {
3073   FileDescriptor* placeholder = tables_->Allocate<FileDescriptor>();
3074   memset(placeholder, 0, sizeof(*placeholder));
3075 
3076   placeholder->name_ = tables_->AllocateString(name);
3077   placeholder->package_ = &internal::GetEmptyString();
3078   placeholder->pool_ = pool_;
3079   placeholder->options_ = &FileOptions::default_instance();
3080   placeholder->tables_ = &FileDescriptorTables::kEmpty;
3081   placeholder->is_placeholder_ = true;
3082   // All other fields are zero or NULL.
3083 
3084   return placeholder;
3085 }
3086 
AddSymbol(const string & full_name,const void * parent,const string & name,const Message & proto,Symbol symbol)3087 bool DescriptorBuilder::AddSymbol(
3088     const string& full_name, const void* parent, const string& name,
3089     const Message& proto, Symbol symbol) {
3090   // If the caller passed NULL for the parent, the symbol is at file scope.
3091   // Use its file as the parent instead.
3092   if (parent == NULL) parent = file_;
3093 
3094   if (tables_->AddSymbol(full_name, symbol)) {
3095     if (!file_tables_->AddAliasUnderParent(parent, name, symbol)) {
3096       GOOGLE_LOG(DFATAL) << "\"" << full_name << "\" not previously defined in "
3097                      "symbols_by_name_, but was defined in symbols_by_parent_; "
3098                      "this shouldn't be possible.";
3099       return false;
3100     }
3101     return true;
3102   } else {
3103     const FileDescriptor* other_file = tables_->FindSymbol(full_name).GetFile();
3104     if (other_file == file_) {
3105       string::size_type dot_pos = full_name.find_last_of('.');
3106       if (dot_pos == string::npos) {
3107         AddError(full_name, proto, DescriptorPool::ErrorCollector::NAME,
3108                  "\"" + full_name + "\" is already defined.");
3109       } else {
3110         AddError(full_name, proto, DescriptorPool::ErrorCollector::NAME,
3111                  "\"" + full_name.substr(dot_pos + 1) +
3112                  "\" is already defined in \"" +
3113                  full_name.substr(0, dot_pos) + "\".");
3114       }
3115     } else {
3116       // Symbol seems to have been defined in a different file.
3117       AddError(full_name, proto, DescriptorPool::ErrorCollector::NAME,
3118                "\"" + full_name + "\" is already defined in file \"" +
3119                other_file->name() + "\".");
3120     }
3121     return false;
3122   }
3123 }
3124 
AddPackage(const string & name,const Message & proto,const FileDescriptor * file)3125 void DescriptorBuilder::AddPackage(
3126     const string& name, const Message& proto, const FileDescriptor* file) {
3127   if (tables_->AddSymbol(name, Symbol(file))) {
3128     // Success.  Also add parent package, if any.
3129     string::size_type dot_pos = name.find_last_of('.');
3130     if (dot_pos == string::npos) {
3131       // No parents.
3132       ValidateSymbolName(name, name, proto);
3133     } else {
3134       // Has parent.
3135       string* parent_name = tables_->AllocateString(name.substr(0, dot_pos));
3136       AddPackage(*parent_name, proto, file);
3137       ValidateSymbolName(name.substr(dot_pos + 1), name, proto);
3138     }
3139   } else {
3140     Symbol existing_symbol = tables_->FindSymbol(name);
3141     // It's OK to redefine a package.
3142     if (existing_symbol.type != Symbol::PACKAGE) {
3143       // Symbol seems to have been defined in a different file.
3144       AddError(name, proto, DescriptorPool::ErrorCollector::NAME,
3145                "\"" + name + "\" is already defined (as something other than "
3146                "a package) in file \"" + existing_symbol.GetFile()->name() +
3147                "\".");
3148     }
3149   }
3150 }
3151 
ValidateSymbolName(const string & name,const string & full_name,const Message & proto)3152 void DescriptorBuilder::ValidateSymbolName(
3153     const string& name, const string& full_name, const Message& proto) {
3154   if (name.empty()) {
3155     AddError(full_name, proto, DescriptorPool::ErrorCollector::NAME,
3156              "Missing name.");
3157   } else {
3158     for (int i = 0; i < name.size(); i++) {
3159       // I don't trust isalnum() due to locales.  :(
3160       if ((name[i] < 'a' || 'z' < name[i]) &&
3161           (name[i] < 'A' || 'Z' < name[i]) &&
3162           (name[i] < '0' || '9' < name[i]) &&
3163           (name[i] != '_')) {
3164         AddError(full_name, proto, DescriptorPool::ErrorCollector::NAME,
3165                  "\"" + name + "\" is not a valid identifier.");
3166       }
3167     }
3168   }
3169 }
3170 
ValidateQualifiedName(const string & name)3171 bool DescriptorBuilder::ValidateQualifiedName(const string& name) {
3172   bool last_was_period = false;
3173 
3174   for (int i = 0; i < name.size(); i++) {
3175     // I don't trust isalnum() due to locales.  :(
3176     if (('a' <= name[i] && name[i] <= 'z') ||
3177         ('A' <= name[i] && name[i] <= 'Z') ||
3178         ('0' <= name[i] && name[i] <= '9') ||
3179         (name[i] == '_')) {
3180       last_was_period = false;
3181     } else if (name[i] == '.') {
3182       if (last_was_period) return false;
3183       last_was_period = true;
3184     } else {
3185       return false;
3186     }
3187   }
3188 
3189   return !name.empty() && !last_was_period;
3190 }
3191 
3192 // -------------------------------------------------------------------
3193 
3194 // This generic implementation is good for all descriptors except
3195 // FileDescriptor.
AllocateOptions(const typename DescriptorT::OptionsType & orig_options,DescriptorT * descriptor)3196 template<class DescriptorT> void DescriptorBuilder::AllocateOptions(
3197     const typename DescriptorT::OptionsType& orig_options,
3198     DescriptorT* descriptor) {
3199   AllocateOptionsImpl(descriptor->full_name(), descriptor->full_name(),
3200                       orig_options, descriptor);
3201 }
3202 
3203 // We specialize for FileDescriptor.
AllocateOptions(const FileOptions & orig_options,FileDescriptor * descriptor)3204 void DescriptorBuilder::AllocateOptions(const FileOptions& orig_options,
3205                                         FileDescriptor* descriptor) {
3206   // We add the dummy token so that LookupSymbol does the right thing.
3207   AllocateOptionsImpl(descriptor->package() + ".dummy", descriptor->name(),
3208                       orig_options, descriptor);
3209 }
3210 
AllocateOptionsImpl(const string & name_scope,const string & element_name,const typename DescriptorT::OptionsType & orig_options,DescriptorT * descriptor)3211 template<class DescriptorT> void DescriptorBuilder::AllocateOptionsImpl(
3212     const string& name_scope,
3213     const string& element_name,
3214     const typename DescriptorT::OptionsType& orig_options,
3215     DescriptorT* descriptor) {
3216   // We need to use a dummy pointer to work around a bug in older versions of
3217   // GCC.  Otherwise, the following two lines could be replaced with:
3218   //   typename DescriptorT::OptionsType* options =
3219   //       tables_->AllocateMessage<typename DescriptorT::OptionsType>();
3220   typename DescriptorT::OptionsType* const dummy = NULL;
3221   typename DescriptorT::OptionsType* options = tables_->AllocateMessage(dummy);
3222   // Avoid using MergeFrom()/CopyFrom() in this class to make it -fno-rtti
3223   // friendly. Without RTTI, MergeFrom() and CopyFrom() will fallback to the
3224   // reflection based method, which requires the Descriptor. However, we are in
3225   // the middle of building the descriptors, thus the deadlock.
3226   options->ParseFromString(orig_options.SerializeAsString());
3227   descriptor->options_ = options;
3228 
3229   // Don't add to options_to_interpret_ unless there were uninterpreted
3230   // options.  This not only avoids unnecessary work, but prevents a
3231   // bootstrapping problem when building descriptors for descriptor.proto.
3232   // descriptor.proto does not contain any uninterpreted options, but
3233   // attempting to interpret options anyway will cause
3234   // OptionsType::GetDescriptor() to be called which may then deadlock since
3235   // we're still trying to build it.
3236   if (options->uninterpreted_option_size() > 0) {
3237     options_to_interpret_.push_back(
3238         OptionsToInterpret(name_scope, element_name, &orig_options, options));
3239   }
3240 }
3241 
3242 
3243 // A common pattern:  We want to convert a repeated field in the descriptor
3244 // to an array of values, calling some method to build each value.
3245 #define BUILD_ARRAY(INPUT, OUTPUT, NAME, METHOD, PARENT)             \
3246   OUTPUT->NAME##_count_ = INPUT.NAME##_size();                       \
3247   AllocateArray(INPUT.NAME##_size(), &OUTPUT->NAME##s_);             \
3248   for (int i = 0; i < INPUT.NAME##_size(); i++) {                    \
3249     METHOD(INPUT.NAME(i), PARENT, OUTPUT->NAME##s_ + i);             \
3250   }
3251 
AddRecursiveImportError(const FileDescriptorProto & proto,int from_here)3252 void DescriptorBuilder::AddRecursiveImportError(
3253     const FileDescriptorProto& proto, int from_here) {
3254   string error_message("File recursively imports itself: ");
3255   for (int i = from_here; i < tables_->pending_files_.size(); i++) {
3256     error_message.append(tables_->pending_files_[i]);
3257     error_message.append(" -> ");
3258   }
3259   error_message.append(proto.name());
3260 
3261   AddError(proto.name(), proto, DescriptorPool::ErrorCollector::OTHER,
3262            error_message);
3263 }
3264 
AddTwiceListedError(const FileDescriptorProto & proto,int index)3265 void DescriptorBuilder::AddTwiceListedError(const FileDescriptorProto& proto,
3266                                             int index) {
3267   AddError(proto.name(), proto, DescriptorPool::ErrorCollector::OTHER,
3268            "Import \"" + proto.dependency(index) + "\" was listed twice.");
3269 }
3270 
AddImportError(const FileDescriptorProto & proto,int index)3271 void DescriptorBuilder::AddImportError(const FileDescriptorProto& proto,
3272                                        int index) {
3273   string message;
3274   if (pool_->fallback_database_ == NULL) {
3275     message = "Import \"" + proto.dependency(index) +
3276               "\" has not been loaded.";
3277   } else {
3278     message = "Import \"" + proto.dependency(index) +
3279               "\" was not found or had errors.";
3280   }
3281   AddError(proto.name(), proto, DescriptorPool::ErrorCollector::OTHER, message);
3282 }
3283 
ExistingFileMatchesProto(const FileDescriptor * existing_file,const FileDescriptorProto & proto)3284 static bool ExistingFileMatchesProto(const FileDescriptor* existing_file,
3285                                      const FileDescriptorProto& proto) {
3286   FileDescriptorProto existing_proto;
3287   existing_file->CopyTo(&existing_proto);
3288   return existing_proto.SerializeAsString() == proto.SerializeAsString();
3289 }
3290 
BuildFile(const FileDescriptorProto & proto)3291 const FileDescriptor* DescriptorBuilder::BuildFile(
3292     const FileDescriptorProto& proto) {
3293   filename_ = proto.name();
3294 
3295   // Check if the file already exists and is identical to the one being built.
3296   // Note:  This only works if the input is canonical -- that is, it
3297   //   fully-qualifies all type names, has no UninterpretedOptions, etc.
3298   //   This is fine, because this idempotency "feature" really only exists to
3299   //   accomodate one hack in the proto1->proto2 migration layer.
3300   const FileDescriptor* existing_file = tables_->FindFile(filename_);
3301   if (existing_file != NULL) {
3302     // File already in pool.  Compare the existing one to the input.
3303     if (ExistingFileMatchesProto(existing_file, proto)) {
3304       // They're identical.  Return the existing descriptor.
3305       return existing_file;
3306     }
3307 
3308     // Not a match.  The error will be detected and handled later.
3309   }
3310 
3311   // Check to see if this file is already on the pending files list.
3312   // TODO(kenton):  Allow recursive imports?  It may not work with some
3313   //   (most?) programming languages.  E.g., in C++, a forward declaration
3314   //   of a type is not sufficient to allow it to be used even in a
3315   //   generated header file due to inlining.  This could perhaps be
3316   //   worked around using tricks involving inserting #include statements
3317   //   mid-file, but that's pretty ugly, and I'm pretty sure there are
3318   //   some languages out there that do not allow recursive dependencies
3319   //   at all.
3320   for (int i = 0; i < tables_->pending_files_.size(); i++) {
3321     if (tables_->pending_files_[i] == proto.name()) {
3322       AddRecursiveImportError(proto, i);
3323       return NULL;
3324     }
3325   }
3326 
3327   // If we have a fallback_database_, attempt to load all dependencies now,
3328   // before checkpointing tables_.  This avoids confusion with recursive
3329   // checkpoints.
3330   if (pool_->fallback_database_ != NULL) {
3331     tables_->pending_files_.push_back(proto.name());
3332     for (int i = 0; i < proto.dependency_size(); i++) {
3333       if (tables_->FindFile(proto.dependency(i)) == NULL &&
3334           (pool_->underlay_ == NULL ||
3335            pool_->underlay_->FindFileByName(proto.dependency(i)) == NULL)) {
3336         // We don't care what this returns since we'll find out below anyway.
3337         pool_->TryFindFileInFallbackDatabase(proto.dependency(i));
3338       }
3339     }
3340     tables_->pending_files_.pop_back();
3341   }
3342 
3343   // Checkpoint the tables so that we can roll back if something goes wrong.
3344   tables_->AddCheckpoint();
3345 
3346   FileDescriptor* result = tables_->Allocate<FileDescriptor>();
3347   file_ = result;
3348 
3349   result->is_placeholder_ = false;
3350   if (proto.has_source_code_info()) {
3351     SourceCodeInfo *info = tables_->AllocateMessage<SourceCodeInfo>();
3352     info->CopyFrom(proto.source_code_info());
3353     result->source_code_info_ = info;
3354   } else {
3355     result->source_code_info_ = &SourceCodeInfo::default_instance();
3356   }
3357 
3358   file_tables_ = tables_->AllocateFileTables();
3359   file_->tables_ = file_tables_;
3360 
3361   if (!proto.has_name()) {
3362     AddError("", proto, DescriptorPool::ErrorCollector::OTHER,
3363              "Missing field: FileDescriptorProto.name.");
3364   }
3365 
3366   result->name_ = tables_->AllocateString(proto.name());
3367   if (proto.has_package()) {
3368     result->package_ = tables_->AllocateString(proto.package());
3369   } else {
3370     // We cannot rely on proto.package() returning a valid string if
3371     // proto.has_package() is false, because we might be running at static
3372     // initialization time, in which case default values have not yet been
3373     // initialized.
3374     result->package_ = tables_->AllocateString("");
3375   }
3376   result->pool_ = pool_;
3377 
3378   // Add to tables.
3379   if (!tables_->AddFile(result)) {
3380     AddError(proto.name(), proto, DescriptorPool::ErrorCollector::OTHER,
3381              "A file with this name is already in the pool.");
3382     // Bail out early so that if this is actually the exact same file, we
3383     // don't end up reporting that every single symbol is already defined.
3384     tables_->RollbackToLastCheckpoint();
3385     return NULL;
3386   }
3387   if (!result->package().empty()) {
3388     AddPackage(result->package(), proto, result);
3389   }
3390 
3391   // Make sure all dependencies are loaded.
3392   set<string> seen_dependencies;
3393   result->dependency_count_ = proto.dependency_size();
3394   result->dependencies_ =
3395     tables_->AllocateArray<const FileDescriptor*>(proto.dependency_size());
3396   unused_dependency_.clear();
3397   set<int> weak_deps;
3398   for (int i = 0; i < proto.weak_dependency_size(); ++i) {
3399     weak_deps.insert(proto.weak_dependency(i));
3400   }
3401   for (int i = 0; i < proto.dependency_size(); i++) {
3402     if (!seen_dependencies.insert(proto.dependency(i)).second) {
3403       AddTwiceListedError(proto, i);
3404     }
3405 
3406     const FileDescriptor* dependency = tables_->FindFile(proto.dependency(i));
3407     if (dependency == NULL && pool_->underlay_ != NULL) {
3408       dependency = pool_->underlay_->FindFileByName(proto.dependency(i));
3409     }
3410 
3411     if (dependency == NULL) {
3412       if (pool_->allow_unknown_ ||
3413           (!pool_->enforce_weak_ && weak_deps.find(i) != weak_deps.end())) {
3414         dependency = NewPlaceholderFile(proto.dependency(i));
3415       } else {
3416         AddImportError(proto, i);
3417       }
3418     } else {
3419       // Add to unused_dependency_ to track unused imported files.
3420       // Note: do not track unused imported files for public import.
3421       if (pool_->enforce_dependencies_ &&
3422           (pool_->unused_import_track_files_.find(proto.name()) !=
3423            pool_->unused_import_track_files_.end()) &&
3424           (dependency->public_dependency_count() == 0)) {
3425         unused_dependency_.insert(dependency);
3426       }
3427     }
3428 
3429     result->dependencies_[i] = dependency;
3430   }
3431 
3432   // Check public dependencies.
3433   int public_dependency_count = 0;
3434   result->public_dependencies_ = tables_->AllocateArray<int>(
3435       proto.public_dependency_size());
3436   for (int i = 0; i < proto.public_dependency_size(); i++) {
3437     // Only put valid public dependency indexes.
3438     int index = proto.public_dependency(i);
3439     if (index >= 0 && index < proto.dependency_size()) {
3440       result->public_dependencies_[public_dependency_count++] = index;
3441       // Do not track unused imported files for public import.
3442       unused_dependency_.erase(result->dependency(index));
3443     } else {
3444       AddError(proto.name(), proto,
3445                DescriptorPool::ErrorCollector::OTHER,
3446                "Invalid public dependency index.");
3447     }
3448   }
3449   result->public_dependency_count_ = public_dependency_count;
3450 
3451   // Build dependency set
3452   dependencies_.clear();
3453   for (int i = 0; i < result->dependency_count(); i++) {
3454     RecordPublicDependencies(result->dependency(i));
3455   }
3456 
3457   // Check weak dependencies.
3458   int weak_dependency_count = 0;
3459   result->weak_dependencies_ = tables_->AllocateArray<int>(
3460       proto.weak_dependency_size());
3461   for (int i = 0; i < proto.weak_dependency_size(); i++) {
3462     int index = proto.weak_dependency(i);
3463     if (index >= 0 && index < proto.dependency_size()) {
3464       result->weak_dependencies_[weak_dependency_count++] = index;
3465     } else {
3466       AddError(proto.name(), proto,
3467                DescriptorPool::ErrorCollector::OTHER,
3468                "Invalid weak dependency index.");
3469     }
3470   }
3471   result->weak_dependency_count_ = weak_dependency_count;
3472 
3473   // Convert children.
3474   BUILD_ARRAY(proto, result, message_type, BuildMessage  , NULL);
3475   BUILD_ARRAY(proto, result, enum_type   , BuildEnum     , NULL);
3476   BUILD_ARRAY(proto, result, service     , BuildService  , NULL);
3477   BUILD_ARRAY(proto, result, extension   , BuildExtension, NULL);
3478 
3479   // Copy options.
3480   if (!proto.has_options()) {
3481     result->options_ = NULL;  // Will set to default_instance later.
3482   } else {
3483     AllocateOptions(proto.options(), result);
3484   }
3485 
3486   // Note that the following steps must occur in exactly the specified order.
3487 
3488   // Cross-link.
3489   CrossLinkFile(result, proto);
3490 
3491   // Interpret any remaining uninterpreted options gathered into
3492   // options_to_interpret_ during descriptor building.  Cross-linking has made
3493   // extension options known, so all interpretations should now succeed.
3494   if (!had_errors_) {
3495     OptionInterpreter option_interpreter(this);
3496     for (vector<OptionsToInterpret>::iterator iter =
3497              options_to_interpret_.begin();
3498          iter != options_to_interpret_.end(); ++iter) {
3499       option_interpreter.InterpretOptions(&(*iter));
3500     }
3501     options_to_interpret_.clear();
3502   }
3503 
3504   // Validate options.
3505   if (!had_errors_) {
3506     ValidateFileOptions(result, proto);
3507   }
3508 
3509 
3510   if (!unused_dependency_.empty()) {
3511     LogUnusedDependency(result);
3512   }
3513 
3514   if (had_errors_) {
3515     tables_->RollbackToLastCheckpoint();
3516     return NULL;
3517   } else {
3518     tables_->ClearLastCheckpoint();
3519     return result;
3520   }
3521 }
3522 
BuildMessage(const DescriptorProto & proto,const Descriptor * parent,Descriptor * result)3523 void DescriptorBuilder::BuildMessage(const DescriptorProto& proto,
3524                                      const Descriptor* parent,
3525                                      Descriptor* result) {
3526   const string& scope = (parent == NULL) ?
3527     file_->package() : parent->full_name();
3528   string* full_name = tables_->AllocateString(scope);
3529   if (!full_name->empty()) full_name->append(1, '.');
3530   full_name->append(proto.name());
3531 
3532   ValidateSymbolName(proto.name(), *full_name, proto);
3533 
3534   result->name_            = tables_->AllocateString(proto.name());
3535   result->full_name_       = full_name;
3536   result->file_            = file_;
3537   result->containing_type_ = parent;
3538   result->is_placeholder_  = false;
3539   result->is_unqualified_placeholder_ = false;
3540 
3541   // Build oneofs first so that fields and extension ranges can refer to them.
3542   BUILD_ARRAY(proto, result, oneof_decl     , BuildOneof         , result);
3543   BUILD_ARRAY(proto, result, field          , BuildField         , result);
3544   BUILD_ARRAY(proto, result, nested_type    , BuildMessage       , result);
3545   BUILD_ARRAY(proto, result, enum_type      , BuildEnum          , result);
3546   BUILD_ARRAY(proto, result, extension_range, BuildExtensionRange, result);
3547   BUILD_ARRAY(proto, result, extension      , BuildExtension     , result);
3548 
3549   // Copy options.
3550   if (!proto.has_options()) {
3551     result->options_ = NULL;  // Will set to default_instance later.
3552   } else {
3553     AllocateOptions(proto.options(), result);
3554   }
3555 
3556   AddSymbol(result->full_name(), parent, result->name(),
3557             proto, Symbol(result));
3558 
3559   // Check that no fields have numbers in extension ranges.
3560   for (int i = 0; i < result->field_count(); i++) {
3561     const FieldDescriptor* field = result->field(i);
3562     for (int j = 0; j < result->extension_range_count(); j++) {
3563       const Descriptor::ExtensionRange* range = result->extension_range(j);
3564       if (range->start <= field->number() && field->number() < range->end) {
3565         AddError(field->full_name(), proto.extension_range(j),
3566                  DescriptorPool::ErrorCollector::NUMBER,
3567                  strings::Substitute(
3568                    "Extension range $0 to $1 includes field \"$2\" ($3).",
3569                    range->start, range->end - 1,
3570                    field->name(), field->number()));
3571       }
3572     }
3573   }
3574 
3575   // Check that extension ranges don't overlap.
3576   for (int i = 0; i < result->extension_range_count(); i++) {
3577     const Descriptor::ExtensionRange* range1 = result->extension_range(i);
3578     for (int j = i + 1; j < result->extension_range_count(); j++) {
3579       const Descriptor::ExtensionRange* range2 = result->extension_range(j);
3580       if (range1->end > range2->start && range2->end > range1->start) {
3581         AddError(result->full_name(), proto.extension_range(j),
3582                  DescriptorPool::ErrorCollector::NUMBER,
3583                  strings::Substitute("Extension range $0 to $1 overlaps with "
3584                                      "already-defined range $2 to $3.",
3585                                      range2->start, range2->end - 1,
3586                                      range1->start, range1->end - 1));
3587       }
3588     }
3589   }
3590 }
3591 
BuildFieldOrExtension(const FieldDescriptorProto & proto,const Descriptor * parent,FieldDescriptor * result,bool is_extension)3592 void DescriptorBuilder::BuildFieldOrExtension(const FieldDescriptorProto& proto,
3593                                               const Descriptor* parent,
3594                                               FieldDescriptor* result,
3595                                               bool is_extension) {
3596   const string& scope = (parent == NULL) ?
3597     file_->package() : parent->full_name();
3598   string* full_name = tables_->AllocateString(scope);
3599   if (!full_name->empty()) full_name->append(1, '.');
3600   full_name->append(proto.name());
3601 
3602   ValidateSymbolName(proto.name(), *full_name, proto);
3603 
3604   result->name_         = tables_->AllocateString(proto.name());
3605   result->full_name_    = full_name;
3606   result->file_         = file_;
3607   result->number_       = proto.number();
3608   result->is_extension_ = is_extension;
3609 
3610   // If .proto files follow the style guide then the name should already be
3611   // lower-cased.  If that's the case we can just reuse the string we already
3612   // allocated rather than allocate a new one.
3613   string lowercase_name(proto.name());
3614   LowerString(&lowercase_name);
3615   if (lowercase_name == proto.name()) {
3616     result->lowercase_name_ = result->name_;
3617   } else {
3618     result->lowercase_name_ = tables_->AllocateString(lowercase_name);
3619   }
3620 
3621   // Don't bother with the above optimization for camel-case names since
3622   // .proto files that follow the guide shouldn't be using names in this
3623   // format, so the optimization wouldn't help much.
3624   result->camelcase_name_ = tables_->AllocateString(ToCamelCase(proto.name()));
3625 
3626   // Some compilers do not allow static_cast directly between two enum types,
3627   // so we must cast to int first.
3628   result->type_  = static_cast<FieldDescriptor::Type>(
3629                      implicit_cast<int>(proto.type()));
3630   result->label_ = static_cast<FieldDescriptor::Label>(
3631                      implicit_cast<int>(proto.label()));
3632 
3633   // An extension cannot have a required field (b/13365836).
3634   if (result->is_extension_ &&
3635       result->label_ == FieldDescriptor::LABEL_REQUIRED) {
3636     AddError(result->full_name(), proto,
3637              // Error location `TYPE`: we would really like to indicate
3638              // `LABEL`, but the `ErrorLocation` enum has no entry for this, and
3639              // we don't necessarily know about all implementations of the
3640              // `ErrorCollector` interface to extend them to handle the new
3641              // error location type properly.
3642              DescriptorPool::ErrorCollector::TYPE,
3643              "Message extensions cannot have required fields.");
3644   }
3645 
3646   // Some of these may be filled in when cross-linking.
3647   result->containing_type_ = NULL;
3648   result->extension_scope_ = NULL;
3649   result->experimental_map_key_ = NULL;
3650   result->message_type_ = NULL;
3651   result->enum_type_ = NULL;
3652 
3653   result->has_default_value_ = proto.has_default_value();
3654   if (proto.has_default_value() && result->is_repeated()) {
3655     AddError(result->full_name(), proto,
3656              DescriptorPool::ErrorCollector::DEFAULT_VALUE,
3657              "Repeated fields can't have default values.");
3658   }
3659 
3660   if (proto.has_type()) {
3661     if (proto.has_default_value()) {
3662       char* end_pos = NULL;
3663       switch (result->cpp_type()) {
3664         case FieldDescriptor::CPPTYPE_INT32:
3665           result->default_value_int32_ =
3666             strtol(proto.default_value().c_str(), &end_pos, 0);
3667           break;
3668         case FieldDescriptor::CPPTYPE_INT64:
3669           result->default_value_int64_ =
3670             strto64(proto.default_value().c_str(), &end_pos, 0);
3671           break;
3672         case FieldDescriptor::CPPTYPE_UINT32:
3673           result->default_value_uint32_ =
3674             strtoul(proto.default_value().c_str(), &end_pos, 0);
3675           break;
3676         case FieldDescriptor::CPPTYPE_UINT64:
3677           result->default_value_uint64_ =
3678             strtou64(proto.default_value().c_str(), &end_pos, 0);
3679           break;
3680         case FieldDescriptor::CPPTYPE_FLOAT:
3681           if (proto.default_value() == "inf") {
3682             result->default_value_float_ = numeric_limits<float>::infinity();
3683           } else if (proto.default_value() == "-inf") {
3684             result->default_value_float_ = -numeric_limits<float>::infinity();
3685           } else if (proto.default_value() == "nan") {
3686             result->default_value_float_ = numeric_limits<float>::quiet_NaN();
3687           } else  {
3688             result->default_value_float_ =
3689               io::NoLocaleStrtod(proto.default_value().c_str(), &end_pos);
3690           }
3691           break;
3692         case FieldDescriptor::CPPTYPE_DOUBLE:
3693           if (proto.default_value() == "inf") {
3694             result->default_value_double_ = numeric_limits<double>::infinity();
3695           } else if (proto.default_value() == "-inf") {
3696             result->default_value_double_ = -numeric_limits<double>::infinity();
3697           } else if (proto.default_value() == "nan") {
3698             result->default_value_double_ = numeric_limits<double>::quiet_NaN();
3699           } else  {
3700             result->default_value_double_ =
3701                 io::NoLocaleStrtod(proto.default_value().c_str(), &end_pos);
3702           }
3703           break;
3704         case FieldDescriptor::CPPTYPE_BOOL:
3705           if (proto.default_value() == "true") {
3706             result->default_value_bool_ = true;
3707           } else if (proto.default_value() == "false") {
3708             result->default_value_bool_ = false;
3709           } else {
3710             AddError(result->full_name(), proto,
3711                      DescriptorPool::ErrorCollector::DEFAULT_VALUE,
3712                      "Boolean default must be true or false.");
3713           }
3714           break;
3715         case FieldDescriptor::CPPTYPE_ENUM:
3716           // This will be filled in when cross-linking.
3717           result->default_value_enum_ = NULL;
3718           break;
3719         case FieldDescriptor::CPPTYPE_STRING:
3720           if (result->type() == FieldDescriptor::TYPE_BYTES) {
3721             result->default_value_string_ = tables_->AllocateString(
3722               UnescapeCEscapeString(proto.default_value()));
3723           } else {
3724             result->default_value_string_ =
3725                 tables_->AllocateString(proto.default_value());
3726           }
3727           break;
3728         case FieldDescriptor::CPPTYPE_MESSAGE:
3729           AddError(result->full_name(), proto,
3730                    DescriptorPool::ErrorCollector::DEFAULT_VALUE,
3731                    "Messages can't have default values.");
3732           result->has_default_value_ = false;
3733           break;
3734       }
3735 
3736       if (end_pos != NULL) {
3737         // end_pos is only set non-NULL by the parsers for numeric types, above.
3738         // This checks that the default was non-empty and had no extra junk
3739         // after the end of the number.
3740         if (proto.default_value().empty() || *end_pos != '\0') {
3741           AddError(result->full_name(), proto,
3742                    DescriptorPool::ErrorCollector::DEFAULT_VALUE,
3743                    "Couldn't parse default value \"" + proto.default_value() +
3744                    "\".");
3745         }
3746       }
3747     } else {
3748       // No explicit default value
3749       switch (result->cpp_type()) {
3750         case FieldDescriptor::CPPTYPE_INT32:
3751           result->default_value_int32_ = 0;
3752           break;
3753         case FieldDescriptor::CPPTYPE_INT64:
3754           result->default_value_int64_ = 0;
3755           break;
3756         case FieldDescriptor::CPPTYPE_UINT32:
3757           result->default_value_uint32_ = 0;
3758           break;
3759         case FieldDescriptor::CPPTYPE_UINT64:
3760           result->default_value_uint64_ = 0;
3761           break;
3762         case FieldDescriptor::CPPTYPE_FLOAT:
3763           result->default_value_float_ = 0.0f;
3764           break;
3765         case FieldDescriptor::CPPTYPE_DOUBLE:
3766           result->default_value_double_ = 0.0;
3767           break;
3768         case FieldDescriptor::CPPTYPE_BOOL:
3769           result->default_value_bool_ = false;
3770           break;
3771         case FieldDescriptor::CPPTYPE_ENUM:
3772           // This will be filled in when cross-linking.
3773           result->default_value_enum_ = NULL;
3774           break;
3775         case FieldDescriptor::CPPTYPE_STRING:
3776           result->default_value_string_ = &internal::GetEmptyString();
3777           break;
3778         case FieldDescriptor::CPPTYPE_MESSAGE:
3779           break;
3780       }
3781     }
3782   }
3783 
3784   if (result->number() <= 0) {
3785     AddError(result->full_name(), proto, DescriptorPool::ErrorCollector::NUMBER,
3786              "Field numbers must be positive integers.");
3787   } else if (!is_extension && result->number() > FieldDescriptor::kMaxNumber) {
3788     // Only validate that the number is within the valid field range if it is
3789     // not an extension. Since extension numbers are validated with the
3790     // extendee's valid set of extension numbers, and those are in turn
3791     // validated against the max allowed number, the check is unnecessary for
3792     // extension fields.
3793     // This avoids cross-linking issues that arise when attempting to check if
3794     // the extendee is a message_set_wire_format message, which has a higher max
3795     // on extension numbers.
3796     AddError(result->full_name(), proto, DescriptorPool::ErrorCollector::NUMBER,
3797              strings::Substitute("Field numbers cannot be greater than $0.",
3798                                  FieldDescriptor::kMaxNumber));
3799   } else if (result->number() >= FieldDescriptor::kFirstReservedNumber &&
3800              result->number() <= FieldDescriptor::kLastReservedNumber) {
3801     AddError(result->full_name(), proto, DescriptorPool::ErrorCollector::NUMBER,
3802              strings::Substitute(
3803                "Field numbers $0 through $1 are reserved for the protocol "
3804                "buffer library implementation.",
3805                FieldDescriptor::kFirstReservedNumber,
3806                FieldDescriptor::kLastReservedNumber));
3807   }
3808 
3809   if (is_extension) {
3810     if (!proto.has_extendee()) {
3811       AddError(result->full_name(), proto,
3812                DescriptorPool::ErrorCollector::EXTENDEE,
3813                "FieldDescriptorProto.extendee not set for extension field.");
3814     }
3815 
3816     result->extension_scope_ = parent;
3817 
3818     if (proto.has_oneof_index()) {
3819       AddError(result->full_name(), proto,
3820                DescriptorPool::ErrorCollector::OTHER,
3821                "FieldDescriptorProto.oneof_index should not be set for "
3822                "extensions.");
3823     }
3824 
3825     // Fill in later (maybe).
3826     result->containing_oneof_ = NULL;
3827   } else {
3828     if (proto.has_extendee()) {
3829       AddError(result->full_name(), proto,
3830                DescriptorPool::ErrorCollector::EXTENDEE,
3831                "FieldDescriptorProto.extendee set for non-extension field.");
3832     }
3833 
3834     result->containing_type_ = parent;
3835 
3836     if (proto.has_oneof_index()) {
3837       if (proto.oneof_index() < 0 ||
3838           proto.oneof_index() >= parent->oneof_decl_count()) {
3839         AddError(result->full_name(), proto,
3840                  DescriptorPool::ErrorCollector::OTHER,
3841                  strings::Substitute("FieldDescriptorProto.oneof_index $0 is "
3842                                      "out of range for type \"$1\".",
3843                                      proto.oneof_index(),
3844                                      parent->name()));
3845         result->containing_oneof_ = NULL;
3846       } else {
3847         result->containing_oneof_ = parent->oneof_decl(proto.oneof_index());
3848       }
3849     } else {
3850       result->containing_oneof_ = NULL;
3851     }
3852   }
3853 
3854   // Copy options.
3855   if (!proto.has_options()) {
3856     result->options_ = NULL;  // Will set to default_instance later.
3857   } else {
3858     AllocateOptions(proto.options(), result);
3859   }
3860 
3861   AddSymbol(result->full_name(), parent, result->name(),
3862             proto, Symbol(result));
3863 }
3864 
BuildExtensionRange(const DescriptorProto::ExtensionRange & proto,const Descriptor * parent,Descriptor::ExtensionRange * result)3865 void DescriptorBuilder::BuildExtensionRange(
3866     const DescriptorProto::ExtensionRange& proto,
3867     const Descriptor* parent,
3868     Descriptor::ExtensionRange* result) {
3869   result->start = proto.start();
3870   result->end = proto.end();
3871   if (result->start <= 0) {
3872     AddError(parent->full_name(), proto,
3873              DescriptorPool::ErrorCollector::NUMBER,
3874              "Extension numbers must be positive integers.");
3875   }
3876 
3877   // Checking of the upper bound of the extension range is deferred until after
3878   // options interpreting. This allows messages with message_set_wire_format to
3879   // have extensions beyond FieldDescriptor::kMaxNumber, since the extension
3880   // numbers are actually used as int32s in the message_set_wire_format.
3881 
3882   if (result->start >= result->end) {
3883     AddError(parent->full_name(), proto,
3884              DescriptorPool::ErrorCollector::NUMBER,
3885              "Extension range end number must be greater than start number.");
3886   }
3887 }
3888 
BuildOneof(const OneofDescriptorProto & proto,Descriptor * parent,OneofDescriptor * result)3889 void DescriptorBuilder::BuildOneof(const OneofDescriptorProto& proto,
3890                                    Descriptor* parent,
3891                                    OneofDescriptor* result) {
3892   string* full_name = tables_->AllocateString(parent->full_name());
3893   full_name->append(1, '.');
3894   full_name->append(proto.name());
3895 
3896   ValidateSymbolName(proto.name(), *full_name, proto);
3897 
3898   result->name_ = tables_->AllocateString(proto.name());
3899   result->full_name_ = full_name;
3900 
3901   result->containing_type_ = parent;
3902 
3903   // We need to fill these in later.
3904   result->field_count_ = 0;
3905   result->fields_ = NULL;
3906 
3907   AddSymbol(result->full_name(), parent, result->name(),
3908             proto, Symbol(result));
3909 }
3910 
BuildEnum(const EnumDescriptorProto & proto,const Descriptor * parent,EnumDescriptor * result)3911 void DescriptorBuilder::BuildEnum(const EnumDescriptorProto& proto,
3912                                   const Descriptor* parent,
3913                                   EnumDescriptor* result) {
3914   const string& scope = (parent == NULL) ?
3915     file_->package() : parent->full_name();
3916   string* full_name = tables_->AllocateString(scope);
3917   if (!full_name->empty()) full_name->append(1, '.');
3918   full_name->append(proto.name());
3919 
3920   ValidateSymbolName(proto.name(), *full_name, proto);
3921 
3922   result->name_            = tables_->AllocateString(proto.name());
3923   result->full_name_       = full_name;
3924   result->file_            = file_;
3925   result->containing_type_ = parent;
3926   result->is_placeholder_  = false;
3927   result->is_unqualified_placeholder_ = false;
3928 
3929   if (proto.value_size() == 0) {
3930     // We cannot allow enums with no values because this would mean there
3931     // would be no valid default value for fields of this type.
3932     AddError(result->full_name(), proto,
3933              DescriptorPool::ErrorCollector::NAME,
3934              "Enums must contain at least one value.");
3935   }
3936 
3937   BUILD_ARRAY(proto, result, value, BuildEnumValue, result);
3938 
3939   // Copy options.
3940   if (!proto.has_options()) {
3941     result->options_ = NULL;  // Will set to default_instance later.
3942   } else {
3943     AllocateOptions(proto.options(), result);
3944   }
3945 
3946   AddSymbol(result->full_name(), parent, result->name(),
3947             proto, Symbol(result));
3948 }
3949 
BuildEnumValue(const EnumValueDescriptorProto & proto,const EnumDescriptor * parent,EnumValueDescriptor * result)3950 void DescriptorBuilder::BuildEnumValue(const EnumValueDescriptorProto& proto,
3951                                        const EnumDescriptor* parent,
3952                                        EnumValueDescriptor* result) {
3953   result->name_   = tables_->AllocateString(proto.name());
3954   result->number_ = proto.number();
3955   result->type_   = parent;
3956 
3957   // Note:  full_name for enum values is a sibling to the parent's name, not a
3958   //   child of it.
3959   string* full_name = tables_->AllocateString(*parent->full_name_);
3960   full_name->resize(full_name->size() - parent->name_->size());
3961   full_name->append(*result->name_);
3962   result->full_name_ = full_name;
3963 
3964   ValidateSymbolName(proto.name(), *full_name, proto);
3965 
3966   // Copy options.
3967   if (!proto.has_options()) {
3968     result->options_ = NULL;  // Will set to default_instance later.
3969   } else {
3970     AllocateOptions(proto.options(), result);
3971   }
3972 
3973   // Again, enum values are weird because we makes them appear as siblings
3974   // of the enum type instead of children of it.  So, we use
3975   // parent->containing_type() as the value's parent.
3976   bool added_to_outer_scope =
3977     AddSymbol(result->full_name(), parent->containing_type(), result->name(),
3978               proto, Symbol(result));
3979 
3980   // However, we also want to be able to search for values within a single
3981   // enum type, so we add it as a child of the enum type itself, too.
3982   // Note:  This could fail, but if it does, the error has already been
3983   //   reported by the above AddSymbol() call, so we ignore the return code.
3984   bool added_to_inner_scope =
3985     file_tables_->AddAliasUnderParent(parent, result->name(), Symbol(result));
3986 
3987   if (added_to_inner_scope && !added_to_outer_scope) {
3988     // This value did not conflict with any values defined in the same enum,
3989     // but it did conflict with some other symbol defined in the enum type's
3990     // scope.  Let's print an additional error to explain this.
3991     string outer_scope;
3992     if (parent->containing_type() == NULL) {
3993       outer_scope = file_->package();
3994     } else {
3995       outer_scope = parent->containing_type()->full_name();
3996     }
3997 
3998     if (outer_scope.empty()) {
3999       outer_scope = "the global scope";
4000     } else {
4001       outer_scope = "\"" + outer_scope + "\"";
4002     }
4003 
4004     AddError(result->full_name(), proto,
4005              DescriptorPool::ErrorCollector::NAME,
4006              "Note that enum values use C++ scoping rules, meaning that "
4007              "enum values are siblings of their type, not children of it.  "
4008              "Therefore, \"" + result->name() + "\" must be unique within "
4009              + outer_scope + ", not just within \"" + parent->name() + "\".");
4010   }
4011 
4012   // An enum is allowed to define two numbers that refer to the same value.
4013   // FindValueByNumber() should return the first such value, so we simply
4014   // ignore AddEnumValueByNumber()'s return code.
4015   file_tables_->AddEnumValueByNumber(result);
4016 }
4017 
BuildService(const ServiceDescriptorProto & proto,const void *,ServiceDescriptor * result)4018 void DescriptorBuilder::BuildService(const ServiceDescriptorProto& proto,
4019                                      const void* /* dummy */,
4020                                      ServiceDescriptor* result) {
4021   string* full_name = tables_->AllocateString(file_->package());
4022   if (!full_name->empty()) full_name->append(1, '.');
4023   full_name->append(proto.name());
4024 
4025   ValidateSymbolName(proto.name(), *full_name, proto);
4026 
4027   result->name_      = tables_->AllocateString(proto.name());
4028   result->full_name_ = full_name;
4029   result->file_      = file_;
4030 
4031   BUILD_ARRAY(proto, result, method, BuildMethod, result);
4032 
4033   // Copy options.
4034   if (!proto.has_options()) {
4035     result->options_ = NULL;  // Will set to default_instance later.
4036   } else {
4037     AllocateOptions(proto.options(), result);
4038   }
4039 
4040   AddSymbol(result->full_name(), NULL, result->name(),
4041             proto, Symbol(result));
4042 }
4043 
BuildMethod(const MethodDescriptorProto & proto,const ServiceDescriptor * parent,MethodDescriptor * result)4044 void DescriptorBuilder::BuildMethod(const MethodDescriptorProto& proto,
4045                                     const ServiceDescriptor* parent,
4046                                     MethodDescriptor* result) {
4047   result->name_    = tables_->AllocateString(proto.name());
4048   result->service_ = parent;
4049 
4050   string* full_name = tables_->AllocateString(parent->full_name());
4051   full_name->append(1, '.');
4052   full_name->append(*result->name_);
4053   result->full_name_ = full_name;
4054 
4055   ValidateSymbolName(proto.name(), *full_name, proto);
4056 
4057   // These will be filled in when cross-linking.
4058   result->input_type_ = NULL;
4059   result->output_type_ = NULL;
4060 
4061   // Copy options.
4062   if (!proto.has_options()) {
4063     result->options_ = NULL;  // Will set to default_instance later.
4064   } else {
4065     AllocateOptions(proto.options(), result);
4066   }
4067 
4068   AddSymbol(result->full_name(), parent, result->name(),
4069             proto, Symbol(result));
4070 }
4071 
4072 #undef BUILD_ARRAY
4073 
4074 // -------------------------------------------------------------------
4075 
CrossLinkFile(FileDescriptor * file,const FileDescriptorProto & proto)4076 void DescriptorBuilder::CrossLinkFile(
4077     FileDescriptor* file, const FileDescriptorProto& proto) {
4078   if (file->options_ == NULL) {
4079     file->options_ = &FileOptions::default_instance();
4080   }
4081 
4082   for (int i = 0; i < file->message_type_count(); i++) {
4083     CrossLinkMessage(&file->message_types_[i], proto.message_type(i));
4084   }
4085 
4086   for (int i = 0; i < file->extension_count(); i++) {
4087     CrossLinkField(&file->extensions_[i], proto.extension(i));
4088   }
4089 
4090   for (int i = 0; i < file->enum_type_count(); i++) {
4091     CrossLinkEnum(&file->enum_types_[i], proto.enum_type(i));
4092   }
4093 
4094   for (int i = 0; i < file->service_count(); i++) {
4095     CrossLinkService(&file->services_[i], proto.service(i));
4096   }
4097 }
4098 
CrossLinkMessage(Descriptor * message,const DescriptorProto & proto)4099 void DescriptorBuilder::CrossLinkMessage(
4100     Descriptor* message, const DescriptorProto& proto) {
4101   if (message->options_ == NULL) {
4102     message->options_ = &MessageOptions::default_instance();
4103   }
4104 
4105   for (int i = 0; i < message->nested_type_count(); i++) {
4106     CrossLinkMessage(&message->nested_types_[i], proto.nested_type(i));
4107   }
4108 
4109   for (int i = 0; i < message->enum_type_count(); i++) {
4110     CrossLinkEnum(&message->enum_types_[i], proto.enum_type(i));
4111   }
4112 
4113   for (int i = 0; i < message->field_count(); i++) {
4114     CrossLinkField(&message->fields_[i], proto.field(i));
4115   }
4116 
4117   for (int i = 0; i < message->extension_count(); i++) {
4118     CrossLinkField(&message->extensions_[i], proto.extension(i));
4119   }
4120 
4121   // Set up field array for each oneof.
4122 
4123   // First count the number of fields per oneof.
4124   for (int i = 0; i < message->field_count(); i++) {
4125     const OneofDescriptor* oneof_decl = message->field(i)->containing_oneof();
4126     if (oneof_decl != NULL) {
4127       // Must go through oneof_decls_ array to get a non-const version of the
4128       // OneofDescriptor.
4129       ++message->oneof_decls_[oneof_decl->index()].field_count_;
4130     }
4131   }
4132 
4133   // Then allocate the arrays.
4134   for (int i = 0; i < message->oneof_decl_count(); i++) {
4135     OneofDescriptor* oneof_decl = &message->oneof_decls_[i];
4136 
4137     if (oneof_decl->field_count() == 0) {
4138       AddError(message->full_name() + "." + oneof_decl->name(),
4139                proto.oneof_decl(i),
4140                DescriptorPool::ErrorCollector::NAME,
4141                "Oneof must have at least one field.");
4142     }
4143 
4144     oneof_decl->fields_ =
4145       tables_->AllocateArray<const FieldDescriptor*>(oneof_decl->field_count_);
4146     oneof_decl->field_count_ = 0;
4147   }
4148 
4149   // Then fill them in.
4150   for (int i = 0; i < message->field_count(); i++) {
4151     const OneofDescriptor* oneof_decl = message->field(i)->containing_oneof();
4152     if (oneof_decl != NULL) {
4153       OneofDescriptor* mutable_oneof_decl =
4154           &message->oneof_decls_[oneof_decl->index()];
4155       message->fields_[i].index_in_oneof_ = mutable_oneof_decl->field_count_;
4156       mutable_oneof_decl->fields_[mutable_oneof_decl->field_count_++] =
4157           message->field(i);
4158     }
4159   }
4160 }
4161 
CrossLinkField(FieldDescriptor * field,const FieldDescriptorProto & proto)4162 void DescriptorBuilder::CrossLinkField(
4163     FieldDescriptor* field, const FieldDescriptorProto& proto) {
4164   if (field->options_ == NULL) {
4165     field->options_ = &FieldOptions::default_instance();
4166   }
4167 
4168   if (proto.has_extendee()) {
4169     Symbol extendee = LookupSymbol(proto.extendee(), field->full_name(),
4170                                    PLACEHOLDER_EXTENDABLE_MESSAGE);
4171     if (extendee.IsNull()) {
4172       AddNotDefinedError(field->full_name(), proto,
4173                          DescriptorPool::ErrorCollector::EXTENDEE,
4174                          proto.extendee());
4175       return;
4176     } else if (extendee.type != Symbol::MESSAGE) {
4177       AddError(field->full_name(), proto,
4178                DescriptorPool::ErrorCollector::EXTENDEE,
4179                "\"" + proto.extendee() + "\" is not a message type.");
4180       return;
4181     }
4182     field->containing_type_ = extendee.descriptor;
4183 
4184     const Descriptor::ExtensionRange* extension_range = field->containing_type()
4185         ->FindExtensionRangeContainingNumber(field->number());
4186 
4187     if (extension_range == NULL) {
4188       AddError(field->full_name(), proto,
4189                DescriptorPool::ErrorCollector::NUMBER,
4190                strings::Substitute("\"$0\" does not declare $1 as an "
4191                                    "extension number.",
4192                                    field->containing_type()->full_name(),
4193                                    field->number()));
4194     }
4195   }
4196 
4197   if (field->containing_oneof() != NULL) {
4198     if (field->label() != FieldDescriptor::LABEL_OPTIONAL) {
4199       // Note that this error will never happen when parsing .proto files.
4200       // It can only happen if you manually construct a FileDescriptorProto
4201       // that is incorrect.
4202       AddError(field->full_name(), proto,
4203                DescriptorPool::ErrorCollector::NAME,
4204                "Fields of oneofs must themselves have label LABEL_OPTIONAL.");
4205     }
4206   }
4207 
4208   if (proto.has_type_name()) {
4209     // Assume we are expecting a message type unless the proto contains some
4210     // evidence that it expects an enum type.  This only makes a difference if
4211     // we end up creating a placeholder.
4212     bool expecting_enum = (proto.type() == FieldDescriptorProto::TYPE_ENUM) ||
4213                           proto.has_default_value();
4214 
4215     Symbol type =
4216       LookupSymbol(proto.type_name(), field->full_name(),
4217                    expecting_enum ? PLACEHOLDER_ENUM : PLACEHOLDER_MESSAGE,
4218                    LOOKUP_TYPES);
4219 
4220     // If the type is a weak type, we change the type to a google.protobuf.Empty field.
4221     if (type.IsNull() && !pool_->enforce_weak_ && proto.options().weak()) {
4222       type = FindSymbol(kNonLinkedWeakMessageReplacementName);
4223     }
4224 
4225     if (type.IsNull()) {
4226       AddNotDefinedError(field->full_name(), proto,
4227                          DescriptorPool::ErrorCollector::TYPE,
4228                          proto.type_name());
4229       return;
4230     }
4231 
4232     if (!proto.has_type()) {
4233       // Choose field type based on symbol.
4234       if (type.type == Symbol::MESSAGE) {
4235         field->type_ = FieldDescriptor::TYPE_MESSAGE;
4236       } else if (type.type == Symbol::ENUM) {
4237         field->type_ = FieldDescriptor::TYPE_ENUM;
4238       } else {
4239         AddError(field->full_name(), proto,
4240                  DescriptorPool::ErrorCollector::TYPE,
4241                  "\"" + proto.type_name() + "\" is not a type.");
4242         return;
4243       }
4244     }
4245 
4246     if (field->cpp_type() == FieldDescriptor::CPPTYPE_MESSAGE) {
4247       if (type.type != Symbol::MESSAGE) {
4248         AddError(field->full_name(), proto,
4249                  DescriptorPool::ErrorCollector::TYPE,
4250                  "\"" + proto.type_name() + "\" is not a message type.");
4251         return;
4252       }
4253       field->message_type_ = type.descriptor;
4254 
4255       if (field->has_default_value()) {
4256         AddError(field->full_name(), proto,
4257                  DescriptorPool::ErrorCollector::DEFAULT_VALUE,
4258                  "Messages can't have default values.");
4259       }
4260     } else if (field->cpp_type() == FieldDescriptor::CPPTYPE_ENUM) {
4261       if (type.type != Symbol::ENUM) {
4262         AddError(field->full_name(), proto,
4263                  DescriptorPool::ErrorCollector::TYPE,
4264                  "\"" + proto.type_name() + "\" is not an enum type.");
4265         return;
4266       }
4267       field->enum_type_ = type.enum_descriptor;
4268 
4269       if (field->enum_type()->is_placeholder_) {
4270         // We can't look up default values for placeholder types.  We'll have
4271         // to just drop them.
4272         field->has_default_value_ = false;
4273       }
4274 
4275       if (field->has_default_value()) {
4276         // Ensure that the default value is an identifier. Parser cannot always
4277         // verify this because it does not have complete type information.
4278         // N.B. that this check yields better error messages but is not
4279         // necessary for correctness (an enum symbol must be a valid identifier
4280         // anyway), only for better errors.
4281         if (!io::Tokenizer::IsIdentifier(proto.default_value())) {
4282           AddError(field->full_name(), proto,
4283                    DescriptorPool::ErrorCollector::DEFAULT_VALUE,
4284                    "Default value for an enum field must be an identifier.");
4285         } else {
4286           // We can't just use field->enum_type()->FindValueByName() here
4287           // because that locks the pool's mutex, which we have already locked
4288           // at this point.
4289           Symbol default_value =
4290             LookupSymbolNoPlaceholder(proto.default_value(),
4291                                       field->enum_type()->full_name());
4292 
4293           if (default_value.type == Symbol::ENUM_VALUE &&
4294               default_value.enum_value_descriptor->type() ==
4295               field->enum_type()) {
4296             field->default_value_enum_ = default_value.enum_value_descriptor;
4297           } else {
4298             AddError(field->full_name(), proto,
4299                      DescriptorPool::ErrorCollector::DEFAULT_VALUE,
4300                      "Enum type \"" + field->enum_type()->full_name() +
4301                      "\" has no value named \"" + proto.default_value() +
4302                      "\".");
4303           }
4304         }
4305       } else if (field->enum_type()->value_count() > 0) {
4306         // All enums must have at least one value, or we would have reported
4307         // an error elsewhere.  We use the first defined value as the default
4308         // if a default is not explicitly defined.
4309         field->default_value_enum_ = field->enum_type()->value(0);
4310       }
4311     } else {
4312       AddError(field->full_name(), proto, DescriptorPool::ErrorCollector::TYPE,
4313                "Field with primitive type has type_name.");
4314     }
4315   } else {
4316     if (field->cpp_type() == FieldDescriptor::CPPTYPE_MESSAGE ||
4317         field->cpp_type() == FieldDescriptor::CPPTYPE_ENUM) {
4318       AddError(field->full_name(), proto, DescriptorPool::ErrorCollector::TYPE,
4319                "Field with message or enum type missing type_name.");
4320     }
4321   }
4322 
4323   // Add the field to the fields-by-number table.
4324   // Note:  We have to do this *after* cross-linking because extensions do not
4325   //   know their containing type until now.
4326   if (!file_tables_->AddFieldByNumber(field)) {
4327     const FieldDescriptor* conflicting_field =
4328       file_tables_->FindFieldByNumber(field->containing_type(),
4329                                       field->number());
4330     if (field->is_extension()) {
4331       AddError(field->full_name(), proto,
4332                DescriptorPool::ErrorCollector::NUMBER,
4333                strings::Substitute("Extension number $0 has already been used "
4334                                    "in \"$1\" by extension \"$2\".",
4335                                    field->number(),
4336                                    field->containing_type()->full_name(),
4337                                    conflicting_field->full_name()));
4338     } else {
4339       AddError(field->full_name(), proto,
4340                DescriptorPool::ErrorCollector::NUMBER,
4341                strings::Substitute("Field number $0 has already been used in "
4342                                    "\"$1\" by field \"$2\".",
4343                                    field->number(),
4344                                    field->containing_type()->full_name(),
4345                                    conflicting_field->name()));
4346     }
4347   } else {
4348     if (field->is_extension()) {
4349       if (!tables_->AddExtension(field)) {
4350         const FieldDescriptor* conflicting_field =
4351             tables_->FindExtension(field->containing_type(), field->number());
4352         string error_msg = strings::Substitute(
4353             "Extension number $0 has already been used in \"$1\" by extension "
4354             "\"$2\" defined in $3.",
4355             field->number(),
4356             field->containing_type()->full_name(),
4357             conflicting_field->full_name(),
4358             conflicting_field->file()->name());
4359         // Conflicting extension numbers should be an error. However, before
4360         // turning this into an error we need to fix all existing broken
4361         // protos first.
4362         // TODO(xiaofeng): Change this to an error.
4363         AddWarning(field->full_name(), proto,
4364                    DescriptorPool::ErrorCollector::NUMBER, error_msg);
4365       }
4366     }
4367   }
4368 
4369   // Add the field to the lowercase-name and camelcase-name tables.
4370   file_tables_->AddFieldByStylizedNames(field);
4371 }
4372 
CrossLinkEnum(EnumDescriptor * enum_type,const EnumDescriptorProto & proto)4373 void DescriptorBuilder::CrossLinkEnum(
4374     EnumDescriptor* enum_type, const EnumDescriptorProto& proto) {
4375   if (enum_type->options_ == NULL) {
4376     enum_type->options_ = &EnumOptions::default_instance();
4377   }
4378 
4379   for (int i = 0; i < enum_type->value_count(); i++) {
4380     CrossLinkEnumValue(&enum_type->values_[i], proto.value(i));
4381   }
4382 }
4383 
CrossLinkEnumValue(EnumValueDescriptor * enum_value,const EnumValueDescriptorProto &)4384 void DescriptorBuilder::CrossLinkEnumValue(
4385     EnumValueDescriptor* enum_value,
4386     const EnumValueDescriptorProto& /* proto */) {
4387   if (enum_value->options_ == NULL) {
4388     enum_value->options_ = &EnumValueOptions::default_instance();
4389   }
4390 }
4391 
CrossLinkService(ServiceDescriptor * service,const ServiceDescriptorProto & proto)4392 void DescriptorBuilder::CrossLinkService(
4393     ServiceDescriptor* service, const ServiceDescriptorProto& proto) {
4394   if (service->options_ == NULL) {
4395     service->options_ = &ServiceOptions::default_instance();
4396   }
4397 
4398   for (int i = 0; i < service->method_count(); i++) {
4399     CrossLinkMethod(&service->methods_[i], proto.method(i));
4400   }
4401 }
4402 
CrossLinkMethod(MethodDescriptor * method,const MethodDescriptorProto & proto)4403 void DescriptorBuilder::CrossLinkMethod(
4404     MethodDescriptor* method, const MethodDescriptorProto& proto) {
4405   if (method->options_ == NULL) {
4406     method->options_ = &MethodOptions::default_instance();
4407   }
4408 
4409   Symbol input_type = LookupSymbol(proto.input_type(), method->full_name());
4410   if (input_type.IsNull()) {
4411     AddNotDefinedError(method->full_name(), proto,
4412                        DescriptorPool::ErrorCollector::INPUT_TYPE,
4413                        proto.input_type());
4414   } else if (input_type.type != Symbol::MESSAGE) {
4415     AddError(method->full_name(), proto,
4416              DescriptorPool::ErrorCollector::INPUT_TYPE,
4417              "\"" + proto.input_type() + "\" is not a message type.");
4418   } else {
4419     method->input_type_ = input_type.descriptor;
4420   }
4421 
4422   Symbol output_type = LookupSymbol(proto.output_type(), method->full_name());
4423   if (output_type.IsNull()) {
4424     AddNotDefinedError(method->full_name(), proto,
4425                        DescriptorPool::ErrorCollector::OUTPUT_TYPE,
4426                        proto.output_type());
4427   } else if (output_type.type != Symbol::MESSAGE) {
4428     AddError(method->full_name(), proto,
4429              DescriptorPool::ErrorCollector::OUTPUT_TYPE,
4430              "\"" + proto.output_type() + "\" is not a message type.");
4431   } else {
4432     method->output_type_ = output_type.descriptor;
4433   }
4434 }
4435 
4436 // -------------------------------------------------------------------
4437 
4438 #define VALIDATE_OPTIONS_FROM_ARRAY(descriptor, array_name, type)  \
4439   for (int i = 0; i < descriptor->array_name##_count(); ++i) {     \
4440     Validate##type##Options(descriptor->array_name##s_ + i,        \
4441                             proto.array_name(i));                  \
4442   }
4443 
4444 // Determine if the file uses optimize_for = LITE_RUNTIME, being careful to
4445 // avoid problems that exist at init time.
IsLite(const FileDescriptor * file)4446 static bool IsLite(const FileDescriptor* file) {
4447   // TODO(kenton):  I don't even remember how many of these conditions are
4448   //   actually possible.  I'm just being super-safe.
4449   return file != NULL &&
4450          &file->options() != &FileOptions::default_instance() &&
4451          file->options().optimize_for() == FileOptions::LITE_RUNTIME;
4452 }
4453 
ValidateFileOptions(FileDescriptor * file,const FileDescriptorProto & proto)4454 void DescriptorBuilder::ValidateFileOptions(FileDescriptor* file,
4455                                             const FileDescriptorProto& proto) {
4456   VALIDATE_OPTIONS_FROM_ARRAY(file, message_type, Message);
4457   VALIDATE_OPTIONS_FROM_ARRAY(file, enum_type, Enum);
4458   VALIDATE_OPTIONS_FROM_ARRAY(file, service, Service);
4459   VALIDATE_OPTIONS_FROM_ARRAY(file, extension, Field);
4460 
4461   // Lite files can only be imported by other Lite files.
4462   if (!IsLite(file)) {
4463     for (int i = 0; i < file->dependency_count(); i++) {
4464       if (IsLite(file->dependency(i))) {
4465         AddError(
4466           file->name(), proto,
4467           DescriptorPool::ErrorCollector::OTHER,
4468           "Files that do not use optimize_for = LITE_RUNTIME cannot import "
4469           "files which do use this option.  This file is not lite, but it "
4470           "imports \"" + file->dependency(i)->name() + "\" which is.");
4471         break;
4472       }
4473     }
4474   }
4475 }
4476 
4477 
ValidateMessageOptions(Descriptor * message,const DescriptorProto & proto)4478 void DescriptorBuilder::ValidateMessageOptions(Descriptor* message,
4479                                                const DescriptorProto& proto) {
4480   VALIDATE_OPTIONS_FROM_ARRAY(message, field, Field);
4481   VALIDATE_OPTIONS_FROM_ARRAY(message, nested_type, Message);
4482   VALIDATE_OPTIONS_FROM_ARRAY(message, enum_type, Enum);
4483   VALIDATE_OPTIONS_FROM_ARRAY(message, extension, Field);
4484 
4485   const int64 max_extension_range =
4486       static_cast<int64>(message->options().message_set_wire_format() ?
4487                          kint32max :
4488                          FieldDescriptor::kMaxNumber);
4489   for (int i = 0; i < message->extension_range_count(); ++i) {
4490     if (message->extension_range(i)->end > max_extension_range + 1) {
4491       AddError(
4492           message->full_name(), proto.extension_range(i),
4493           DescriptorPool::ErrorCollector::NUMBER,
4494           strings::Substitute("Extension numbers cannot be greater than $0.",
4495                               max_extension_range));
4496     }
4497   }
4498 }
4499 
ValidateFieldOptions(FieldDescriptor * field,const FieldDescriptorProto & proto)4500 void DescriptorBuilder::ValidateFieldOptions(FieldDescriptor* field,
4501     const FieldDescriptorProto& proto) {
4502   if (field->options().has_experimental_map_key()) {
4503     ValidateMapKey(field, proto);
4504   }
4505 
4506   // Only message type fields may be lazy.
4507   if (field->options().lazy()) {
4508     if (field->type() != FieldDescriptor::TYPE_MESSAGE) {
4509       AddError(field->full_name(), proto,
4510                DescriptorPool::ErrorCollector::TYPE,
4511                "[lazy = true] can only be specified for submessage fields.");
4512     }
4513   }
4514 
4515   // Only repeated primitive fields may be packed.
4516   if (field->options().packed() && !field->is_packable()) {
4517     AddError(
4518       field->full_name(), proto,
4519       DescriptorPool::ErrorCollector::TYPE,
4520       "[packed = true] can only be specified for repeated primitive fields.");
4521   }
4522 
4523   // Note:  Default instance may not yet be initialized here, so we have to
4524   //   avoid reading from it.
4525   if (field->containing_type_ != NULL &&
4526       &field->containing_type()->options() !=
4527       &MessageOptions::default_instance() &&
4528       field->containing_type()->options().message_set_wire_format()) {
4529     if (field->is_extension()) {
4530       if (!field->is_optional() ||
4531           field->type() != FieldDescriptor::TYPE_MESSAGE) {
4532         AddError(field->full_name(), proto,
4533                  DescriptorPool::ErrorCollector::TYPE,
4534                  "Extensions of MessageSets must be optional messages.");
4535       }
4536     } else {
4537       AddError(field->full_name(), proto,
4538                DescriptorPool::ErrorCollector::NAME,
4539                "MessageSets cannot have fields, only extensions.");
4540     }
4541   }
4542 
4543   // Lite extensions can only be of Lite types.
4544   if (IsLite(field->file()) &&
4545       field->containing_type_ != NULL &&
4546       !IsLite(field->containing_type()->file())) {
4547     AddError(field->full_name(), proto,
4548              DescriptorPool::ErrorCollector::EXTENDEE,
4549              "Extensions to non-lite types can only be declared in non-lite "
4550              "files.  Note that you cannot extend a non-lite type to contain "
4551              "a lite type, but the reverse is allowed.");
4552   }
4553 
4554 }
4555 
ValidateEnumOptions(EnumDescriptor * enm,const EnumDescriptorProto & proto)4556 void DescriptorBuilder::ValidateEnumOptions(EnumDescriptor* enm,
4557                                             const EnumDescriptorProto& proto) {
4558   VALIDATE_OPTIONS_FROM_ARRAY(enm, value, EnumValue);
4559   if (!enm->options().has_allow_alias() || !enm->options().allow_alias()) {
4560     map<int, string> used_values;
4561     for (int i = 0; i < enm->value_count(); ++i) {
4562       const EnumValueDescriptor* enum_value = enm->value(i);
4563       if (used_values.find(enum_value->number()) != used_values.end()) {
4564         string error =
4565             "\"" + enum_value->full_name() +
4566             "\" uses the same enum value as \"" +
4567             used_values[enum_value->number()] + "\". If this is intended, set "
4568             "'option allow_alias = true;' to the enum definition.";
4569         if (!enm->options().allow_alias()) {
4570           // Generate error if duplicated enum values are explicitly disallowed.
4571           AddError(enm->full_name(), proto,
4572                    DescriptorPool::ErrorCollector::NUMBER,
4573                    error);
4574         } else {
4575           // Generate warning if duplicated values are found but the option
4576           // isn't set.
4577           GOOGLE_LOG(ERROR) << error;
4578         }
4579       } else {
4580         used_values[enum_value->number()] = enum_value->full_name();
4581       }
4582     }
4583   }
4584 }
4585 
ValidateEnumValueOptions(EnumValueDescriptor *,const EnumValueDescriptorProto &)4586 void DescriptorBuilder::ValidateEnumValueOptions(
4587     EnumValueDescriptor* /* enum_value */,
4588     const EnumValueDescriptorProto& /* proto */) {
4589   // Nothing to do so far.
4590 }
ValidateServiceOptions(ServiceDescriptor * service,const ServiceDescriptorProto & proto)4591 void DescriptorBuilder::ValidateServiceOptions(ServiceDescriptor* service,
4592     const ServiceDescriptorProto& proto) {
4593   if (IsLite(service->file()) &&
4594       (service->file()->options().cc_generic_services() ||
4595        service->file()->options().java_generic_services())) {
4596     AddError(service->full_name(), proto,
4597              DescriptorPool::ErrorCollector::NAME,
4598              "Files with optimize_for = LITE_RUNTIME cannot define services "
4599              "unless you set both options cc_generic_services and "
4600              "java_generic_sevices to false.");
4601   }
4602 
4603   VALIDATE_OPTIONS_FROM_ARRAY(service, method, Method);
4604 }
4605 
ValidateMethodOptions(MethodDescriptor *,const MethodDescriptorProto &)4606 void DescriptorBuilder::ValidateMethodOptions(MethodDescriptor* /* method */,
4607     const MethodDescriptorProto& /* proto */) {
4608   // Nothing to do so far.
4609 }
4610 
ValidateMapKey(FieldDescriptor * field,const FieldDescriptorProto & proto)4611 void DescriptorBuilder::ValidateMapKey(FieldDescriptor* field,
4612                                        const FieldDescriptorProto& proto) {
4613   if (!field->is_repeated()) {
4614     AddError(field->full_name(), proto, DescriptorPool::ErrorCollector::TYPE,
4615              "map type is only allowed for repeated fields.");
4616     return;
4617   }
4618 
4619   if (field->cpp_type() != FieldDescriptor::CPPTYPE_MESSAGE) {
4620     AddError(field->full_name(), proto, DescriptorPool::ErrorCollector::TYPE,
4621              "map type is only allowed for fields with a message type.");
4622     return;
4623   }
4624 
4625   const Descriptor* item_type = field->message_type();
4626   if (item_type == NULL) {
4627     AddError(field->full_name(), proto, DescriptorPool::ErrorCollector::TYPE,
4628              "Could not find field type.");
4629     return;
4630   }
4631 
4632   // Find the field in item_type named by "experimental_map_key"
4633   const string& key_name = field->options().experimental_map_key();
4634   const Symbol key_symbol = LookupSymbol(
4635       key_name,
4636       // We append ".key_name" to the containing type's name since
4637       // LookupSymbol() searches for peers of the supplied name, not
4638       // children of the supplied name.
4639       item_type->full_name() + "." + key_name);
4640 
4641   if (key_symbol.IsNull() || key_symbol.field_descriptor->is_extension()) {
4642     AddError(field->full_name(), proto, DescriptorPool::ErrorCollector::TYPE,
4643              "Could not find field named \"" + key_name + "\" in type \"" +
4644              item_type->full_name() + "\".");
4645     return;
4646   }
4647   const FieldDescriptor* key_field = key_symbol.field_descriptor;
4648 
4649   if (key_field->is_repeated()) {
4650     AddError(field->full_name(), proto, DescriptorPool::ErrorCollector::TYPE,
4651              "map_key must not name a repeated field.");
4652     return;
4653   }
4654 
4655   if (key_field->cpp_type() == FieldDescriptor::CPPTYPE_MESSAGE) {
4656     AddError(field->full_name(), proto, DescriptorPool::ErrorCollector::TYPE,
4657              "map key must name a scalar or string field.");
4658     return;
4659   }
4660 
4661   field->experimental_map_key_ = key_field;
4662 }
4663 
4664 
4665 #undef VALIDATE_OPTIONS_FROM_ARRAY
4666 
4667 // -------------------------------------------------------------------
4668 
OptionInterpreter(DescriptorBuilder * builder)4669 DescriptorBuilder::OptionInterpreter::OptionInterpreter(
4670     DescriptorBuilder* builder) : builder_(builder) {
4671   GOOGLE_CHECK(builder_);
4672 }
4673 
~OptionInterpreter()4674 DescriptorBuilder::OptionInterpreter::~OptionInterpreter() {
4675 }
4676 
InterpretOptions(OptionsToInterpret * options_to_interpret)4677 bool DescriptorBuilder::OptionInterpreter::InterpretOptions(
4678     OptionsToInterpret* options_to_interpret) {
4679   // Note that these may be in different pools, so we can't use the same
4680   // descriptor and reflection objects on both.
4681   Message* options = options_to_interpret->options;
4682   const Message* original_options = options_to_interpret->original_options;
4683 
4684   bool failed = false;
4685   options_to_interpret_ = options_to_interpret;
4686 
4687   // Find the uninterpreted_option field in the mutable copy of the options
4688   // and clear them, since we're about to interpret them.
4689   const FieldDescriptor* uninterpreted_options_field =
4690       options->GetDescriptor()->FindFieldByName("uninterpreted_option");
4691   GOOGLE_CHECK(uninterpreted_options_field != NULL)
4692       << "No field named \"uninterpreted_option\" in the Options proto.";
4693   options->GetReflection()->ClearField(options, uninterpreted_options_field);
4694 
4695   // Find the uninterpreted_option field in the original options.
4696   const FieldDescriptor* original_uninterpreted_options_field =
4697       original_options->GetDescriptor()->
4698           FindFieldByName("uninterpreted_option");
4699   GOOGLE_CHECK(original_uninterpreted_options_field != NULL)
4700       << "No field named \"uninterpreted_option\" in the Options proto.";
4701 
4702   const int num_uninterpreted_options = original_options->GetReflection()->
4703       FieldSize(*original_options, original_uninterpreted_options_field);
4704   for (int i = 0; i < num_uninterpreted_options; ++i) {
4705     uninterpreted_option_ = down_cast<const UninterpretedOption*>(
4706         &original_options->GetReflection()->GetRepeatedMessage(
4707             *original_options, original_uninterpreted_options_field, i));
4708     if (!InterpretSingleOption(options)) {
4709       // Error already added by InterpretSingleOption().
4710       failed = true;
4711       break;
4712     }
4713   }
4714   // Reset these, so we don't have any dangling pointers.
4715   uninterpreted_option_ = NULL;
4716   options_to_interpret_ = NULL;
4717 
4718   if (!failed) {
4719     // InterpretSingleOption() added the interpreted options in the
4720     // UnknownFieldSet, in case the option isn't yet known to us.  Now we
4721     // serialize the options message and deserialize it back.  That way, any
4722     // option fields that we do happen to know about will get moved from the
4723     // UnknownFieldSet into the real fields, and thus be available right away.
4724     // If they are not known, that's OK too. They will get reparsed into the
4725     // UnknownFieldSet and wait there until the message is parsed by something
4726     // that does know about the options.
4727     string buf;
4728     options->AppendToString(&buf);
4729     GOOGLE_CHECK(options->ParseFromString(buf))
4730         << "Protocol message serialized itself in invalid fashion.";
4731   }
4732 
4733   return !failed;
4734 }
4735 
InterpretSingleOption(Message * options)4736 bool DescriptorBuilder::OptionInterpreter::InterpretSingleOption(
4737     Message* options) {
4738   // First do some basic validation.
4739   if (uninterpreted_option_->name_size() == 0) {
4740     // This should never happen unless the parser has gone seriously awry or
4741     // someone has manually created the uninterpreted option badly.
4742     return AddNameError("Option must have a name.");
4743   }
4744   if (uninterpreted_option_->name(0).name_part() == "uninterpreted_option") {
4745     return AddNameError("Option must not use reserved name "
4746                         "\"uninterpreted_option\".");
4747   }
4748 
4749   const Descriptor* options_descriptor = NULL;
4750   // Get the options message's descriptor from the builder's pool, so that we
4751   // get the version that knows about any extension options declared in the
4752   // file we're currently building. The descriptor should be there as long as
4753   // the file we're building imported "google/protobuf/descriptors.proto".
4754 
4755   // Note that we use DescriptorBuilder::FindSymbolNotEnforcingDeps(), not
4756   // DescriptorPool::FindMessageTypeByName() because we're already holding the
4757   // pool's mutex, and the latter method locks it again.  We don't use
4758   // FindSymbol() because files that use custom options only need to depend on
4759   // the file that defines the option, not descriptor.proto itself.
4760   Symbol symbol = builder_->FindSymbolNotEnforcingDeps(
4761     options->GetDescriptor()->full_name());
4762   if (!symbol.IsNull() && symbol.type == Symbol::MESSAGE) {
4763     options_descriptor = symbol.descriptor;
4764   } else {
4765     // The options message's descriptor was not in the builder's pool, so use
4766     // the standard version from the generated pool. We're not holding the
4767     // generated pool's mutex, so we can search it the straightforward way.
4768     options_descriptor = options->GetDescriptor();
4769   }
4770   GOOGLE_CHECK(options_descriptor);
4771 
4772   // We iterate over the name parts to drill into the submessages until we find
4773   // the leaf field for the option. As we drill down we remember the current
4774   // submessage's descriptor in |descriptor| and the next field in that
4775   // submessage in |field|. We also track the fields we're drilling down
4776   // through in |intermediate_fields|. As we go, we reconstruct the full option
4777   // name in |debug_msg_name|, for use in error messages.
4778   const Descriptor* descriptor = options_descriptor;
4779   const FieldDescriptor* field = NULL;
4780   vector<const FieldDescriptor*> intermediate_fields;
4781   string debug_msg_name = "";
4782 
4783   for (int i = 0; i < uninterpreted_option_->name_size(); ++i) {
4784     const string& name_part = uninterpreted_option_->name(i).name_part();
4785     if (debug_msg_name.size() > 0) {
4786       debug_msg_name += ".";
4787     }
4788     if (uninterpreted_option_->name(i).is_extension()) {
4789       debug_msg_name += "(" + name_part + ")";
4790       // Search for the extension's descriptor as an extension in the builder's
4791       // pool. Note that we use DescriptorBuilder::LookupSymbol(), not
4792       // DescriptorPool::FindExtensionByName(), for two reasons: 1) It allows
4793       // relative lookups, and 2) because we're already holding the pool's
4794       // mutex, and the latter method locks it again.
4795       symbol = builder_->LookupSymbol(name_part,
4796                                       options_to_interpret_->name_scope);
4797       if (!symbol.IsNull() && symbol.type == Symbol::FIELD) {
4798         field = symbol.field_descriptor;
4799       }
4800       // If we don't find the field then the field's descriptor was not in the
4801       // builder's pool, but there's no point in looking in the generated
4802       // pool. We require that you import the file that defines any extensions
4803       // you use, so they must be present in the builder's pool.
4804     } else {
4805       debug_msg_name += name_part;
4806       // Search for the field's descriptor as a regular field.
4807       field = descriptor->FindFieldByName(name_part);
4808     }
4809 
4810     if (field == NULL) {
4811       if (get_allow_unknown(builder_->pool_)) {
4812         // We can't find the option, but AllowUnknownDependencies() is enabled,
4813         // so we will just leave it as uninterpreted.
4814         AddWithoutInterpreting(*uninterpreted_option_, options);
4815         return true;
4816       } else if (!(builder_->undefine_resolved_name_).empty()) {
4817         // Option is resolved to a name which is not defined.
4818         return AddNameError(
4819             "Option \"" + debug_msg_name + "\" is resolved to \"(" +
4820             builder_->undefine_resolved_name_ +
4821             ")\", which is not defined. The innermost scope is searched first "
4822             "in name resolution. Consider using a leading '.'(i.e., \"(." +
4823             debug_msg_name.substr(1) +
4824             "\") to start from the outermost scope.");
4825       } else {
4826         return AddNameError("Option \"" + debug_msg_name + "\" unknown.");
4827       }
4828     } else if (field->containing_type() != descriptor) {
4829       if (get_is_placeholder(field->containing_type())) {
4830         // The field is an extension of a placeholder type, so we can't
4831         // reliably verify whether it is a valid extension to use here (e.g.
4832         // we don't know if it is an extension of the correct *Options message,
4833         // or if it has a valid field number, etc.).  Just leave it as
4834         // uninterpreted instead.
4835         AddWithoutInterpreting(*uninterpreted_option_, options);
4836         return true;
4837       } else {
4838         // This can only happen if, due to some insane misconfiguration of the
4839         // pools, we find the options message in one pool but the field in
4840         // another. This would probably imply a hefty bug somewhere.
4841         return AddNameError("Option field \"" + debug_msg_name +
4842                             "\" is not a field or extension of message \"" +
4843                             descriptor->name() + "\".");
4844       }
4845     } else if (i < uninterpreted_option_->name_size() - 1) {
4846       if (field->cpp_type() != FieldDescriptor::CPPTYPE_MESSAGE) {
4847         return AddNameError("Option \"" +  debug_msg_name +
4848                             "\" is an atomic type, not a message.");
4849       } else if (field->is_repeated()) {
4850         return AddNameError("Option field \"" + debug_msg_name +
4851                             "\" is a repeated message. Repeated message "
4852                             "options must be initialized using an "
4853                             "aggregate value.");
4854       } else {
4855         // Drill down into the submessage.
4856         intermediate_fields.push_back(field);
4857         descriptor = field->message_type();
4858       }
4859     }
4860   }
4861 
4862   // We've found the leaf field. Now we use UnknownFieldSets to set its value
4863   // on the options message. We do so because the message may not yet know
4864   // about its extension fields, so we may not be able to set the fields
4865   // directly. But the UnknownFieldSets will serialize to the same wire-format
4866   // message, so reading that message back in once the extension fields are
4867   // known will populate them correctly.
4868 
4869   // First see if the option is already set.
4870   if (!field->is_repeated() && !ExamineIfOptionIsSet(
4871           intermediate_fields.begin(),
4872           intermediate_fields.end(),
4873           field, debug_msg_name,
4874           options->GetReflection()->GetUnknownFields(*options))) {
4875     return false;  // ExamineIfOptionIsSet() already added the error.
4876   }
4877 
4878 
4879   // First set the value on the UnknownFieldSet corresponding to the
4880   // innermost message.
4881   scoped_ptr<UnknownFieldSet> unknown_fields(new UnknownFieldSet());
4882   if (!SetOptionValue(field, unknown_fields.get())) {
4883     return false;  // SetOptionValue() already added the error.
4884   }
4885 
4886   // Now wrap the UnknownFieldSet with UnknownFieldSets corresponding to all
4887   // the intermediate messages.
4888   for (vector<const FieldDescriptor*>::reverse_iterator iter =
4889            intermediate_fields.rbegin();
4890        iter != intermediate_fields.rend(); ++iter) {
4891     scoped_ptr<UnknownFieldSet> parent_unknown_fields(new UnknownFieldSet());
4892     switch ((*iter)->type()) {
4893       case FieldDescriptor::TYPE_MESSAGE: {
4894         io::StringOutputStream outstr(
4895             parent_unknown_fields->AddLengthDelimited((*iter)->number()));
4896         io::CodedOutputStream out(&outstr);
4897         internal::WireFormat::SerializeUnknownFields(*unknown_fields, &out);
4898         GOOGLE_CHECK(!out.HadError())
4899             << "Unexpected failure while serializing option submessage "
4900             << debug_msg_name << "\".";
4901         break;
4902       }
4903 
4904       case FieldDescriptor::TYPE_GROUP: {
4905          parent_unknown_fields->AddGroup((*iter)->number())
4906                               ->MergeFrom(*unknown_fields);
4907         break;
4908       }
4909 
4910       default:
4911         GOOGLE_LOG(FATAL) << "Invalid wire type for CPPTYPE_MESSAGE: "
4912                    << (*iter)->type();
4913         return false;
4914     }
4915     unknown_fields.reset(parent_unknown_fields.release());
4916   }
4917 
4918   // Now merge the UnknownFieldSet corresponding to the top-level message into
4919   // the options message.
4920   options->GetReflection()->MutableUnknownFields(options)->MergeFrom(
4921       *unknown_fields);
4922 
4923   return true;
4924 }
4925 
AddWithoutInterpreting(const UninterpretedOption & uninterpreted_option,Message * options)4926 void DescriptorBuilder::OptionInterpreter::AddWithoutInterpreting(
4927     const UninterpretedOption& uninterpreted_option, Message* options) {
4928   const FieldDescriptor* field =
4929     options->GetDescriptor()->FindFieldByName("uninterpreted_option");
4930   GOOGLE_CHECK(field != NULL);
4931 
4932   options->GetReflection()->AddMessage(options, field)
4933     ->CopyFrom(uninterpreted_option);
4934 }
4935 
ExamineIfOptionIsSet(vector<const FieldDescriptor * >::const_iterator intermediate_fields_iter,vector<const FieldDescriptor * >::const_iterator intermediate_fields_end,const FieldDescriptor * innermost_field,const string & debug_msg_name,const UnknownFieldSet & unknown_fields)4936 bool DescriptorBuilder::OptionInterpreter::ExamineIfOptionIsSet(
4937     vector<const FieldDescriptor*>::const_iterator intermediate_fields_iter,
4938     vector<const FieldDescriptor*>::const_iterator intermediate_fields_end,
4939     const FieldDescriptor* innermost_field, const string& debug_msg_name,
4940     const UnknownFieldSet& unknown_fields) {
4941   // We do linear searches of the UnknownFieldSet and its sub-groups.  This
4942   // should be fine since it's unlikely that any one options structure will
4943   // contain more than a handful of options.
4944 
4945   if (intermediate_fields_iter == intermediate_fields_end) {
4946     // We're at the innermost submessage.
4947     for (int i = 0; i < unknown_fields.field_count(); i++) {
4948       if (unknown_fields.field(i).number() == innermost_field->number()) {
4949         return AddNameError("Option \"" + debug_msg_name +
4950                             "\" was already set.");
4951       }
4952     }
4953     return true;
4954   }
4955 
4956   for (int i = 0; i < unknown_fields.field_count(); i++) {
4957     if (unknown_fields.field(i).number() ==
4958         (*intermediate_fields_iter)->number()) {
4959       const UnknownField* unknown_field = &unknown_fields.field(i);
4960       FieldDescriptor::Type type = (*intermediate_fields_iter)->type();
4961       // Recurse into the next submessage.
4962       switch (type) {
4963         case FieldDescriptor::TYPE_MESSAGE:
4964           if (unknown_field->type() == UnknownField::TYPE_LENGTH_DELIMITED) {
4965             UnknownFieldSet intermediate_unknown_fields;
4966             if (intermediate_unknown_fields.ParseFromString(
4967                     unknown_field->length_delimited()) &&
4968                 !ExamineIfOptionIsSet(intermediate_fields_iter + 1,
4969                                       intermediate_fields_end,
4970                                       innermost_field, debug_msg_name,
4971                                       intermediate_unknown_fields)) {
4972               return false;  // Error already added.
4973             }
4974           }
4975           break;
4976 
4977         case FieldDescriptor::TYPE_GROUP:
4978           if (unknown_field->type() == UnknownField::TYPE_GROUP) {
4979             if (!ExamineIfOptionIsSet(intermediate_fields_iter + 1,
4980                                       intermediate_fields_end,
4981                                       innermost_field, debug_msg_name,
4982                                       unknown_field->group())) {
4983               return false;  // Error already added.
4984             }
4985           }
4986           break;
4987 
4988         default:
4989           GOOGLE_LOG(FATAL) << "Invalid wire type for CPPTYPE_MESSAGE: " << type;
4990           return false;
4991       }
4992     }
4993   }
4994   return true;
4995 }
4996 
SetOptionValue(const FieldDescriptor * option_field,UnknownFieldSet * unknown_fields)4997 bool DescriptorBuilder::OptionInterpreter::SetOptionValue(
4998     const FieldDescriptor* option_field,
4999     UnknownFieldSet* unknown_fields) {
5000   // We switch on the CppType to validate.
5001   switch (option_field->cpp_type()) {
5002 
5003     case FieldDescriptor::CPPTYPE_INT32:
5004       if (uninterpreted_option_->has_positive_int_value()) {
5005         if (uninterpreted_option_->positive_int_value() >
5006             static_cast<uint64>(kint32max)) {
5007           return AddValueError("Value out of range for int32 option \"" +
5008                                option_field->full_name() + "\".");
5009         } else {
5010           SetInt32(option_field->number(),
5011                    uninterpreted_option_->positive_int_value(),
5012                    option_field->type(), unknown_fields);
5013         }
5014       } else if (uninterpreted_option_->has_negative_int_value()) {
5015         if (uninterpreted_option_->negative_int_value() <
5016             static_cast<int64>(kint32min)) {
5017           return AddValueError("Value out of range for int32 option \"" +
5018                                option_field->full_name() + "\".");
5019         } else {
5020           SetInt32(option_field->number(),
5021                    uninterpreted_option_->negative_int_value(),
5022                    option_field->type(), unknown_fields);
5023         }
5024       } else {
5025         return AddValueError("Value must be integer for int32 option \"" +
5026                              option_field->full_name() + "\".");
5027       }
5028       break;
5029 
5030     case FieldDescriptor::CPPTYPE_INT64:
5031       if (uninterpreted_option_->has_positive_int_value()) {
5032         if (uninterpreted_option_->positive_int_value() >
5033             static_cast<uint64>(kint64max)) {
5034           return AddValueError("Value out of range for int64 option \"" +
5035                                option_field->full_name() + "\".");
5036         } else {
5037           SetInt64(option_field->number(),
5038                    uninterpreted_option_->positive_int_value(),
5039                    option_field->type(), unknown_fields);
5040         }
5041       } else if (uninterpreted_option_->has_negative_int_value()) {
5042         SetInt64(option_field->number(),
5043                  uninterpreted_option_->negative_int_value(),
5044                  option_field->type(), unknown_fields);
5045       } else {
5046         return AddValueError("Value must be integer for int64 option \"" +
5047                              option_field->full_name() + "\".");
5048       }
5049       break;
5050 
5051     case FieldDescriptor::CPPTYPE_UINT32:
5052       if (uninterpreted_option_->has_positive_int_value()) {
5053         if (uninterpreted_option_->positive_int_value() > kuint32max) {
5054           return AddValueError("Value out of range for uint32 option \"" +
5055                                option_field->name() + "\".");
5056         } else {
5057           SetUInt32(option_field->number(),
5058                     uninterpreted_option_->positive_int_value(),
5059                     option_field->type(), unknown_fields);
5060         }
5061       } else {
5062         return AddValueError("Value must be non-negative integer for uint32 "
5063                              "option \"" + option_field->full_name() + "\".");
5064       }
5065       break;
5066 
5067     case FieldDescriptor::CPPTYPE_UINT64:
5068       if (uninterpreted_option_->has_positive_int_value()) {
5069         SetUInt64(option_field->number(),
5070                   uninterpreted_option_->positive_int_value(),
5071                   option_field->type(), unknown_fields);
5072       } else {
5073         return AddValueError("Value must be non-negative integer for uint64 "
5074                              "option \"" + option_field->full_name() + "\".");
5075       }
5076       break;
5077 
5078     case FieldDescriptor::CPPTYPE_FLOAT: {
5079       float value;
5080       if (uninterpreted_option_->has_double_value()) {
5081         value = uninterpreted_option_->double_value();
5082       } else if (uninterpreted_option_->has_positive_int_value()) {
5083         value = uninterpreted_option_->positive_int_value();
5084       } else if (uninterpreted_option_->has_negative_int_value()) {
5085         value = uninterpreted_option_->negative_int_value();
5086       } else {
5087         return AddValueError("Value must be number for float option \"" +
5088                              option_field->full_name() + "\".");
5089       }
5090       unknown_fields->AddFixed32(option_field->number(),
5091           google::protobuf::internal::WireFormatLite::EncodeFloat(value));
5092       break;
5093     }
5094 
5095     case FieldDescriptor::CPPTYPE_DOUBLE: {
5096       double value;
5097       if (uninterpreted_option_->has_double_value()) {
5098         value = uninterpreted_option_->double_value();
5099       } else if (uninterpreted_option_->has_positive_int_value()) {
5100         value = uninterpreted_option_->positive_int_value();
5101       } else if (uninterpreted_option_->has_negative_int_value()) {
5102         value = uninterpreted_option_->negative_int_value();
5103       } else {
5104         return AddValueError("Value must be number for double option \"" +
5105                              option_field->full_name() + "\".");
5106       }
5107       unknown_fields->AddFixed64(option_field->number(),
5108           google::protobuf::internal::WireFormatLite::EncodeDouble(value));
5109       break;
5110     }
5111 
5112     case FieldDescriptor::CPPTYPE_BOOL:
5113       uint64 value;
5114       if (!uninterpreted_option_->has_identifier_value()) {
5115         return AddValueError("Value must be identifier for boolean option "
5116                              "\"" + option_field->full_name() + "\".");
5117       }
5118       if (uninterpreted_option_->identifier_value() == "true") {
5119         value = 1;
5120       } else if (uninterpreted_option_->identifier_value() == "false") {
5121         value = 0;
5122       } else {
5123         return AddValueError("Value must be \"true\" or \"false\" for boolean "
5124                              "option \"" + option_field->full_name() + "\".");
5125       }
5126       unknown_fields->AddVarint(option_field->number(), value);
5127       break;
5128 
5129     case FieldDescriptor::CPPTYPE_ENUM: {
5130       if (!uninterpreted_option_->has_identifier_value()) {
5131         return AddValueError("Value must be identifier for enum-valued option "
5132                              "\"" + option_field->full_name() + "\".");
5133       }
5134       const EnumDescriptor* enum_type = option_field->enum_type();
5135       const string& value_name = uninterpreted_option_->identifier_value();
5136       const EnumValueDescriptor* enum_value = NULL;
5137 
5138       if (enum_type->file()->pool() != DescriptorPool::generated_pool()) {
5139         // Note that the enum value's fully-qualified name is a sibling of the
5140         // enum's name, not a child of it.
5141         string fully_qualified_name = enum_type->full_name();
5142         fully_qualified_name.resize(fully_qualified_name.size() -
5143                                     enum_type->name().size());
5144         fully_qualified_name += value_name;
5145 
5146         // Search for the enum value's descriptor in the builder's pool. Note
5147         // that we use DescriptorBuilder::FindSymbolNotEnforcingDeps(), not
5148         // DescriptorPool::FindEnumValueByName() because we're already holding
5149         // the pool's mutex, and the latter method locks it again.
5150         Symbol symbol =
5151           builder_->FindSymbolNotEnforcingDeps(fully_qualified_name);
5152         if (!symbol.IsNull() && symbol.type == Symbol::ENUM_VALUE) {
5153           if (symbol.enum_value_descriptor->type() != enum_type) {
5154             return AddValueError("Enum type \"" + enum_type->full_name() +
5155                 "\" has no value named \"" + value_name + "\" for option \"" +
5156                 option_field->full_name() +
5157                 "\". This appears to be a value from a sibling type.");
5158           } else {
5159             enum_value = symbol.enum_value_descriptor;
5160           }
5161         }
5162       } else {
5163         // The enum type is in the generated pool, so we can search for the
5164         // value there.
5165         enum_value = enum_type->FindValueByName(value_name);
5166       }
5167 
5168       if (enum_value == NULL) {
5169         return AddValueError("Enum type \"" +
5170                              option_field->enum_type()->full_name() +
5171                              "\" has no value named \"" + value_name + "\" for "
5172                              "option \"" + option_field->full_name() + "\".");
5173       } else {
5174         // Sign-extension is not a problem, since we cast directly from int32 to
5175         // uint64, without first going through uint32.
5176         unknown_fields->AddVarint(option_field->number(),
5177           static_cast<uint64>(static_cast<int64>(enum_value->number())));
5178       }
5179       break;
5180     }
5181 
5182     case FieldDescriptor::CPPTYPE_STRING:
5183       if (!uninterpreted_option_->has_string_value()) {
5184         return AddValueError("Value must be quoted string for string option "
5185                              "\"" + option_field->full_name() + "\".");
5186       }
5187       // The string has already been unquoted and unescaped by the parser.
5188       unknown_fields->AddLengthDelimited(option_field->number(),
5189           uninterpreted_option_->string_value());
5190       break;
5191 
5192     case FieldDescriptor::CPPTYPE_MESSAGE:
5193       if (!SetAggregateOption(option_field, unknown_fields)) {
5194         return false;
5195       }
5196       break;
5197   }
5198 
5199   return true;
5200 }
5201 
5202 class DescriptorBuilder::OptionInterpreter::AggregateOptionFinder
5203     : public TextFormat::Finder {
5204  public:
5205   DescriptorBuilder* builder_;
5206 
FindExtension(Message * message,const string & name) const5207   virtual const FieldDescriptor* FindExtension(
5208       Message* message, const string& name) const {
5209     assert_mutex_held(builder_->pool_);
5210     const Descriptor* descriptor = message->GetDescriptor();
5211     Symbol result = builder_->LookupSymbolNoPlaceholder(
5212         name, descriptor->full_name());
5213     if (result.type == Symbol::FIELD &&
5214         result.field_descriptor->is_extension()) {
5215       return result.field_descriptor;
5216     } else if (result.type == Symbol::MESSAGE &&
5217                descriptor->options().message_set_wire_format()) {
5218       const Descriptor* foreign_type = result.descriptor;
5219       // The text format allows MessageSet items to be specified using
5220       // the type name, rather than the extension identifier. If the symbol
5221       // lookup returned a Message, and the enclosing Message has
5222       // message_set_wire_format = true, then return the message set
5223       // extension, if one exists.
5224       for (int i = 0; i < foreign_type->extension_count(); i++) {
5225         const FieldDescriptor* extension = foreign_type->extension(i);
5226         if (extension->containing_type() == descriptor &&
5227             extension->type() == FieldDescriptor::TYPE_MESSAGE &&
5228             extension->is_optional() &&
5229             extension->message_type() == foreign_type) {
5230           // Found it.
5231           return extension;
5232         }
5233       }
5234     }
5235     return NULL;
5236   }
5237 };
5238 
5239 // A custom error collector to record any text-format parsing errors
5240 namespace {
5241 class AggregateErrorCollector : public io::ErrorCollector {
5242  public:
5243   string error_;
5244 
AddError(int,int,const string & message)5245   virtual void AddError(int /* line */, int /* column */,
5246                         const string& message) {
5247     if (!error_.empty()) {
5248       error_ += "; ";
5249     }
5250     error_ += message;
5251   }
5252 
AddWarning(int,int,const string &)5253   virtual void AddWarning(int /* line */, int /* column */,
5254                           const string& /* message */) {
5255     // Ignore warnings
5256   }
5257 };
5258 }
5259 
5260 // We construct a dynamic message of the type corresponding to
5261 // option_field, parse the supplied text-format string into this
5262 // message, and serialize the resulting message to produce the value.
SetAggregateOption(const FieldDescriptor * option_field,UnknownFieldSet * unknown_fields)5263 bool DescriptorBuilder::OptionInterpreter::SetAggregateOption(
5264     const FieldDescriptor* option_field,
5265     UnknownFieldSet* unknown_fields) {
5266   if (!uninterpreted_option_->has_aggregate_value()) {
5267     return AddValueError("Option \"" + option_field->full_name() +
5268                          "\" is a message. To set the entire message, use "
5269                          "syntax like \"" + option_field->name() +
5270                          " = { <proto text format> }\". "
5271                          "To set fields within it, use "
5272                          "syntax like \"" + option_field->name() +
5273                          ".foo = value\".");
5274   }
5275 
5276   const Descriptor* type = option_field->message_type();
5277   scoped_ptr<Message> dynamic(dynamic_factory_.GetPrototype(type)->New());
5278   GOOGLE_CHECK(dynamic.get() != NULL)
5279       << "Could not create an instance of " << option_field->DebugString();
5280 
5281   AggregateErrorCollector collector;
5282   AggregateOptionFinder finder;
5283   finder.builder_ = builder_;
5284   TextFormat::Parser parser;
5285   parser.RecordErrorsTo(&collector);
5286   parser.SetFinder(&finder);
5287   if (!parser.ParseFromString(uninterpreted_option_->aggregate_value(),
5288                               dynamic.get())) {
5289     AddValueError("Error while parsing option value for \"" +
5290                   option_field->name() + "\": " + collector.error_);
5291     return false;
5292   } else {
5293     string serial;
5294     dynamic->SerializeToString(&serial);  // Never fails
5295     if (option_field->type() == FieldDescriptor::TYPE_MESSAGE) {
5296       unknown_fields->AddLengthDelimited(option_field->number(), serial);
5297     } else {
5298       GOOGLE_CHECK_EQ(option_field->type(),  FieldDescriptor::TYPE_GROUP);
5299       UnknownFieldSet* group = unknown_fields->AddGroup(option_field->number());
5300       group->ParseFromString(serial);
5301     }
5302     return true;
5303   }
5304 }
5305 
SetInt32(int number,int32 value,FieldDescriptor::Type type,UnknownFieldSet * unknown_fields)5306 void DescriptorBuilder::OptionInterpreter::SetInt32(int number, int32 value,
5307     FieldDescriptor::Type type, UnknownFieldSet* unknown_fields) {
5308   switch (type) {
5309     case FieldDescriptor::TYPE_INT32:
5310       unknown_fields->AddVarint(number,
5311         static_cast<uint64>(static_cast<int64>(value)));
5312       break;
5313 
5314     case FieldDescriptor::TYPE_SFIXED32:
5315       unknown_fields->AddFixed32(number, static_cast<uint32>(value));
5316       break;
5317 
5318     case FieldDescriptor::TYPE_SINT32:
5319       unknown_fields->AddVarint(number,
5320           google::protobuf::internal::WireFormatLite::ZigZagEncode32(value));
5321       break;
5322 
5323     default:
5324       GOOGLE_LOG(FATAL) << "Invalid wire type for CPPTYPE_INT32: " << type;
5325       break;
5326   }
5327 }
5328 
SetInt64(int number,int64 value,FieldDescriptor::Type type,UnknownFieldSet * unknown_fields)5329 void DescriptorBuilder::OptionInterpreter::SetInt64(int number, int64 value,
5330     FieldDescriptor::Type type, UnknownFieldSet* unknown_fields) {
5331   switch (type) {
5332     case FieldDescriptor::TYPE_INT64:
5333       unknown_fields->AddVarint(number, static_cast<uint64>(value));
5334       break;
5335 
5336     case FieldDescriptor::TYPE_SFIXED64:
5337       unknown_fields->AddFixed64(number, static_cast<uint64>(value));
5338       break;
5339 
5340     case FieldDescriptor::TYPE_SINT64:
5341       unknown_fields->AddVarint(number,
5342           google::protobuf::internal::WireFormatLite::ZigZagEncode64(value));
5343       break;
5344 
5345     default:
5346       GOOGLE_LOG(FATAL) << "Invalid wire type for CPPTYPE_INT64: " << type;
5347       break;
5348   }
5349 }
5350 
SetUInt32(int number,uint32 value,FieldDescriptor::Type type,UnknownFieldSet * unknown_fields)5351 void DescriptorBuilder::OptionInterpreter::SetUInt32(int number, uint32 value,
5352     FieldDescriptor::Type type, UnknownFieldSet* unknown_fields) {
5353   switch (type) {
5354     case FieldDescriptor::TYPE_UINT32:
5355       unknown_fields->AddVarint(number, static_cast<uint64>(value));
5356       break;
5357 
5358     case FieldDescriptor::TYPE_FIXED32:
5359       unknown_fields->AddFixed32(number, static_cast<uint32>(value));
5360       break;
5361 
5362     default:
5363       GOOGLE_LOG(FATAL) << "Invalid wire type for CPPTYPE_UINT32: " << type;
5364       break;
5365   }
5366 }
5367 
SetUInt64(int number,uint64 value,FieldDescriptor::Type type,UnknownFieldSet * unknown_fields)5368 void DescriptorBuilder::OptionInterpreter::SetUInt64(int number, uint64 value,
5369     FieldDescriptor::Type type, UnknownFieldSet* unknown_fields) {
5370   switch (type) {
5371     case FieldDescriptor::TYPE_UINT64:
5372       unknown_fields->AddVarint(number, value);
5373       break;
5374 
5375     case FieldDescriptor::TYPE_FIXED64:
5376       unknown_fields->AddFixed64(number, value);
5377       break;
5378 
5379     default:
5380       GOOGLE_LOG(FATAL) << "Invalid wire type for CPPTYPE_UINT64: " << type;
5381       break;
5382   }
5383 }
5384 
LogUnusedDependency(const FileDescriptor * result)5385 void DescriptorBuilder::LogUnusedDependency(const FileDescriptor* result) {
5386 
5387   if (!unused_dependency_.empty()) {
5388     std::set<string> annotation_extensions;
5389     annotation_extensions.insert("google.protobuf.MessageOptions");
5390     annotation_extensions.insert("google.protobuf.FileOptions");
5391     annotation_extensions.insert("google.protobuf.FieldOptions");
5392     annotation_extensions.insert("google.protobuf.EnumOptions");
5393     annotation_extensions.insert("google.protobuf.EnumValueOptions");
5394     annotation_extensions.insert("google.protobuf.ServiceOptions");
5395     annotation_extensions.insert("google.protobuf.MethodOptions");
5396     annotation_extensions.insert("google.protobuf.StreamOptions");
5397     for (set<const FileDescriptor*>::const_iterator
5398              it = unused_dependency_.begin();
5399          it != unused_dependency_.end(); ++it) {
5400       // Do not log warnings for proto files which extend annotations.
5401       int i;
5402       for (i = 0 ; i < (*it)->extension_count(); ++i) {
5403         if (annotation_extensions.find(
5404                 (*it)->extension(i)->containing_type()->full_name())
5405             != annotation_extensions.end()) {
5406           break;
5407         }
5408       }
5409       // Log warnings for unused imported files.
5410       if (i == (*it)->extension_count()) {
5411         GOOGLE_LOG(WARNING) << "Warning: Unused import: \"" << result->name()
5412                      << "\" imports \"" << (*it)->name()
5413                      << "\" which is not used.";
5414       }
5415     }
5416   }
5417 }
5418 
5419 }  // namespace protobuf
5420 }  // namespace google
5421