1 //===--- ASTMatchFinder.cpp - Structural query framework ------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 //  Implements an algorithm to efficiently search for matches on AST nodes.
11 //  Uses memoization to support recursive matches like HasDescendant.
12 //
13 //  The general idea is to visit all AST nodes with a RecursiveASTVisitor,
14 //  calling the Matches(...) method of each matcher we are running on each
15 //  AST node. The matcher can recurse via the ASTMatchFinder interface.
16 //
17 //===----------------------------------------------------------------------===//
18 
19 #include "clang/ASTMatchers/ASTMatchFinder.h"
20 #include "clang/AST/ASTConsumer.h"
21 #include "clang/AST/ASTContext.h"
22 #include "clang/AST/RecursiveASTVisitor.h"
23 #include "llvm/ADT/DenseMap.h"
24 #include "llvm/ADT/StringMap.h"
25 #include "llvm/Support/Timer.h"
26 #include <deque>
27 #include <memory>
28 #include <set>
29 
30 namespace clang {
31 namespace ast_matchers {
32 namespace internal {
33 namespace {
34 
35 typedef MatchFinder::MatchCallback MatchCallback;
36 
// The maximum number of memoization entries to store.
// 10k has been experimentally found to give a good trade-off
// of performance vs. memory consumption by running matchers
// that match on every statement over a very large codebase.
//
// The limit is enforced by the matches*Of() entry points, which drop the
// whole result cache once its size exceeds this value.
//
// FIXME: Do some performance optimization in general and
// revisit this number; also, put up micro-benchmarks that we can
// optimize this on.
static const unsigned MaxMemoizationEntries = 10000;
46 
47 // We use memoization to avoid running the same matcher on the same
48 // AST node twice.  This struct is the key for looking up match
49 // result.  It consists of an ID of the MatcherInterface (for
50 // identifying the matcher), a pointer to the AST node and the
51 // bound nodes before the matcher was executed.
52 //
53 // We currently only memoize on nodes whose pointers identify the
54 // nodes (\c Stmt and \c Decl, but not \c QualType or \c TypeLoc).
55 // For \c QualType and \c TypeLoc it is possible to implement
56 // generation of keys for each type.
57 // FIXME: Benchmark whether memoization of non-pointer typed nodes
58 // provides enough benefit for the additional amount of code.
59 struct MatchKey {
60   DynTypedMatcher::MatcherIDType MatcherID;
61   ast_type_traits::DynTypedNode Node;
62   BoundNodesTreeBuilder BoundNodes;
63 
operator <clang::ast_matchers::internal::__anonf927a3570111::MatchKey64   bool operator<(const MatchKey &Other) const {
65     return std::tie(MatcherID, Node, BoundNodes) <
66            std::tie(Other.MatcherID, Other.Node, Other.BoundNodes);
67   }
68 };
69 
// Used to store the result of a match and possibly bound nodes.
// This is the value type of the memoization cache: one entry is recorded per
// MatchKey after the corresponding recursive match has been evaluated.
struct MemoizedMatchResult {
  // Whether the memoized match attempt succeeded.
  bool ResultOfMatch;
  // The bindings as they were after the match attempt finished; copied back
  // into the caller's builder on a cache hit.
  BoundNodesTreeBuilder Nodes;
};
75 
76 // A RecursiveASTVisitor that traverses all children or all descendants of
77 // a node.
78 class MatchChildASTVisitor
79     : public RecursiveASTVisitor<MatchChildASTVisitor> {
80 public:
81   typedef RecursiveASTVisitor<MatchChildASTVisitor> VisitorBase;
82 
83   // Creates an AST visitor that matches 'matcher' on all children or
84   // descendants of a traversed node. max_depth is the maximum depth
85   // to traverse: use 1 for matching the children and INT_MAX for
86   // matching the descendants.
MatchChildASTVisitor(const DynTypedMatcher * Matcher,ASTMatchFinder * Finder,BoundNodesTreeBuilder * Builder,int MaxDepth,ASTMatchFinder::TraversalKind Traversal,ASTMatchFinder::BindKind Bind)87   MatchChildASTVisitor(const DynTypedMatcher *Matcher,
88                        ASTMatchFinder *Finder,
89                        BoundNodesTreeBuilder *Builder,
90                        int MaxDepth,
91                        ASTMatchFinder::TraversalKind Traversal,
92                        ASTMatchFinder::BindKind Bind)
93       : Matcher(Matcher),
94         Finder(Finder),
95         Builder(Builder),
96         CurrentDepth(0),
97         MaxDepth(MaxDepth),
98         Traversal(Traversal),
99         Bind(Bind),
100         Matches(false) {}
101 
102   // Returns true if a match is found in the subtree rooted at the
103   // given AST node. This is done via a set of mutually recursive
104   // functions. Here's how the recursion is done (the  *wildcard can
105   // actually be Decl, Stmt, or Type):
106   //
107   //   - Traverse(node) calls BaseTraverse(node) when it needs
108   //     to visit the descendants of node.
109   //   - BaseTraverse(node) then calls (via VisitorBase::Traverse*(node))
110   //     Traverse*(c) for each child c of 'node'.
111   //   - Traverse*(c) in turn calls Traverse(c), completing the
112   //     recursion.
findMatch(const ast_type_traits::DynTypedNode & DynNode)113   bool findMatch(const ast_type_traits::DynTypedNode &DynNode) {
114     reset();
115     if (const Decl *D = DynNode.get<Decl>())
116       traverse(*D);
117     else if (const Stmt *S = DynNode.get<Stmt>())
118       traverse(*S);
119     else if (const NestedNameSpecifier *NNS =
120              DynNode.get<NestedNameSpecifier>())
121       traverse(*NNS);
122     else if (const NestedNameSpecifierLoc *NNSLoc =
123              DynNode.get<NestedNameSpecifierLoc>())
124       traverse(*NNSLoc);
125     else if (const QualType *Q = DynNode.get<QualType>())
126       traverse(*Q);
127     else if (const TypeLoc *T = DynNode.get<TypeLoc>())
128       traverse(*T);
129     // FIXME: Add other base types after adding tests.
130 
131     // It's OK to always overwrite the bound nodes, as if there was
132     // no match in this recursive branch, the result set is empty
133     // anyway.
134     *Builder = ResultBindings;
135 
136     return Matches;
137   }
138 
139   // The following are overriding methods from the base visitor class.
140   // They are public only to allow CRTP to work. They are *not *part
141   // of the public API of this class.
TraverseDecl(Decl * DeclNode)142   bool TraverseDecl(Decl *DeclNode) {
143     ScopedIncrement ScopedDepth(&CurrentDepth);
144     return (DeclNode == nullptr) || traverse(*DeclNode);
145   }
TraverseStmt(Stmt * StmtNode)146   bool TraverseStmt(Stmt *StmtNode) {
147     ScopedIncrement ScopedDepth(&CurrentDepth);
148     const Stmt *StmtToTraverse = StmtNode;
149     if (Traversal ==
150         ASTMatchFinder::TK_IgnoreImplicitCastsAndParentheses) {
151       const Expr *ExprNode = dyn_cast_or_null<Expr>(StmtNode);
152       if (ExprNode) {
153         StmtToTraverse = ExprNode->IgnoreParenImpCasts();
154       }
155     }
156     return (StmtToTraverse == nullptr) || traverse(*StmtToTraverse);
157   }
158   // We assume that the QualType and the contained type are on the same
159   // hierarchy level. Thus, we try to match either of them.
TraverseType(QualType TypeNode)160   bool TraverseType(QualType TypeNode) {
161     if (TypeNode.isNull())
162       return true;
163     ScopedIncrement ScopedDepth(&CurrentDepth);
164     // Match the Type.
165     if (!match(*TypeNode))
166       return false;
167     // The QualType is matched inside traverse.
168     return traverse(TypeNode);
169   }
170   // We assume that the TypeLoc, contained QualType and contained Type all are
171   // on the same hierarchy level. Thus, we try to match all of them.
TraverseTypeLoc(TypeLoc TypeLocNode)172   bool TraverseTypeLoc(TypeLoc TypeLocNode) {
173     if (TypeLocNode.isNull())
174       return true;
175     ScopedIncrement ScopedDepth(&CurrentDepth);
176     // Match the Type.
177     if (!match(*TypeLocNode.getType()))
178       return false;
179     // Match the QualType.
180     if (!match(TypeLocNode.getType()))
181       return false;
182     // The TypeLoc is matched inside traverse.
183     return traverse(TypeLocNode);
184   }
TraverseNestedNameSpecifier(NestedNameSpecifier * NNS)185   bool TraverseNestedNameSpecifier(NestedNameSpecifier *NNS) {
186     ScopedIncrement ScopedDepth(&CurrentDepth);
187     return (NNS == nullptr) || traverse(*NNS);
188   }
TraverseNestedNameSpecifierLoc(NestedNameSpecifierLoc NNS)189   bool TraverseNestedNameSpecifierLoc(NestedNameSpecifierLoc NNS) {
190     if (!NNS)
191       return true;
192     ScopedIncrement ScopedDepth(&CurrentDepth);
193     if (!match(*NNS.getNestedNameSpecifier()))
194       return false;
195     return traverse(NNS);
196   }
197 
shouldVisitTemplateInstantiations() const198   bool shouldVisitTemplateInstantiations() const { return true; }
shouldVisitImplicitCode() const199   bool shouldVisitImplicitCode() const { return true; }
200 
201 private:
202   // Used for updating the depth during traversal.
203   struct ScopedIncrement {
ScopedIncrementclang::ast_matchers::internal::__anonf927a3570111::MatchChildASTVisitor::ScopedIncrement204     explicit ScopedIncrement(int *Depth) : Depth(Depth) { ++(*Depth); }
~ScopedIncrementclang::ast_matchers::internal::__anonf927a3570111::MatchChildASTVisitor::ScopedIncrement205     ~ScopedIncrement() { --(*Depth); }
206 
207    private:
208     int *Depth;
209   };
210 
211   // Resets the state of this object.
reset()212   void reset() {
213     Matches = false;
214     CurrentDepth = 0;
215   }
216 
217   // Forwards the call to the corresponding Traverse*() method in the
218   // base visitor class.
baseTraverse(const Decl & DeclNode)219   bool baseTraverse(const Decl &DeclNode) {
220     return VisitorBase::TraverseDecl(const_cast<Decl*>(&DeclNode));
221   }
baseTraverse(const Stmt & StmtNode)222   bool baseTraverse(const Stmt &StmtNode) {
223     return VisitorBase::TraverseStmt(const_cast<Stmt*>(&StmtNode));
224   }
baseTraverse(QualType TypeNode)225   bool baseTraverse(QualType TypeNode) {
226     return VisitorBase::TraverseType(TypeNode);
227   }
baseTraverse(TypeLoc TypeLocNode)228   bool baseTraverse(TypeLoc TypeLocNode) {
229     return VisitorBase::TraverseTypeLoc(TypeLocNode);
230   }
baseTraverse(const NestedNameSpecifier & NNS)231   bool baseTraverse(const NestedNameSpecifier &NNS) {
232     return VisitorBase::TraverseNestedNameSpecifier(
233         const_cast<NestedNameSpecifier*>(&NNS));
234   }
baseTraverse(NestedNameSpecifierLoc NNS)235   bool baseTraverse(NestedNameSpecifierLoc NNS) {
236     return VisitorBase::TraverseNestedNameSpecifierLoc(NNS);
237   }
238 
239   // Sets 'Matched' to true if 'Matcher' matches 'Node' and:
240   //   0 < CurrentDepth <= MaxDepth.
241   //
242   // Returns 'true' if traversal should continue after this function
243   // returns, i.e. if no match is found or 'Bind' is 'BK_All'.
244   template <typename T>
match(const T & Node)245   bool match(const T &Node) {
246     if (CurrentDepth == 0 || CurrentDepth > MaxDepth) {
247       return true;
248     }
249     if (Bind != ASTMatchFinder::BK_All) {
250       BoundNodesTreeBuilder RecursiveBuilder(*Builder);
251       if (Matcher->matches(ast_type_traits::DynTypedNode::create(Node), Finder,
252                            &RecursiveBuilder)) {
253         Matches = true;
254         ResultBindings.addMatch(RecursiveBuilder);
255         return false; // Abort as soon as a match is found.
256       }
257     } else {
258       BoundNodesTreeBuilder RecursiveBuilder(*Builder);
259       if (Matcher->matches(ast_type_traits::DynTypedNode::create(Node), Finder,
260                            &RecursiveBuilder)) {
261         // After the first match the matcher succeeds.
262         Matches = true;
263         ResultBindings.addMatch(RecursiveBuilder);
264       }
265     }
266     return true;
267   }
268 
269   // Traverses the subtree rooted at 'Node'; returns true if the
270   // traversal should continue after this function returns.
271   template <typename T>
traverse(const T & Node)272   bool traverse(const T &Node) {
273     static_assert(IsBaseType<T>::value,
274                   "traverse can only be instantiated with base type");
275     if (!match(Node))
276       return false;
277     return baseTraverse(Node);
278   }
279 
280   const DynTypedMatcher *const Matcher;
281   ASTMatchFinder *const Finder;
282   BoundNodesTreeBuilder *const Builder;
283   BoundNodesTreeBuilder ResultBindings;
284   int CurrentDepth;
285   const int MaxDepth;
286   const ASTMatchFinder::TraversalKind Traversal;
287   const ASTMatchFinder::BindKind Bind;
288   bool Matches;
289 };
290 
291 // Controls the outermost traversal of the AST and allows to match multiple
292 // matchers.
293 class MatchASTVisitor : public RecursiveASTVisitor<MatchASTVisitor>,
294                         public ASTMatchFinder {
295 public:
  // Stores the set of matchers to run and the finder options. No AST context
  // is active until set_active_ast_context() is called.
  MatchASTVisitor(const MatchFinder::MatchersByType *Matchers,
                  const MatchFinder::MatchFinderOptions &Options)
      : Matchers(Matchers), Options(Options), ActiveASTContext(nullptr) {}
299 
~MatchASTVisitor()300   ~MatchASTVisitor() override {
301     if (Options.CheckProfiling) {
302       Options.CheckProfiling->Records = std::move(TimeByBucket);
303     }
304   }
305 
onStartOfTranslationUnit()306   void onStartOfTranslationUnit() {
307     const bool EnableCheckProfiling = Options.CheckProfiling.hasValue();
308     TimeBucketRegion Timer;
309     for (MatchCallback *MC : Matchers->AllCallbacks) {
310       if (EnableCheckProfiling)
311         Timer.setBucket(&TimeByBucket[MC->getID()]);
312       MC->onStartOfTranslationUnit();
313     }
314   }
315 
onEndOfTranslationUnit()316   void onEndOfTranslationUnit() {
317     const bool EnableCheckProfiling = Options.CheckProfiling.hasValue();
318     TimeBucketRegion Timer;
319     for (MatchCallback *MC : Matchers->AllCallbacks) {
320       if (EnableCheckProfiling)
321         Timer.setBucket(&TimeByBucket[MC->getID()]);
322       MC->onEndOfTranslationUnit();
323     }
324   }
325 
  // Sets the ASTContext used by subsequent matching (canonical type lookup,
  // parent lookup, and the context passed along with match results).
  void set_active_ast_context(ASTContext *NewActiveASTContext) {
    ActiveASTContext = NewActiveASTContext;
  }
329 
330   // The following Visit*() and Traverse*() functions "override"
331   // methods in RecursiveASTVisitor.
332 
VisitTypedefNameDecl(TypedefNameDecl * DeclNode)333   bool VisitTypedefNameDecl(TypedefNameDecl *DeclNode) {
334     // When we see 'typedef A B', we add name 'B' to the set of names
335     // A's canonical type maps to.  This is necessary for implementing
336     // isDerivedFrom(x) properly, where x can be the name of the base
337     // class or any of its aliases.
338     //
339     // In general, the is-alias-of (as defined by typedefs) relation
340     // is tree-shaped, as you can typedef a type more than once.  For
341     // example,
342     //
343     //   typedef A B;
344     //   typedef A C;
345     //   typedef C D;
346     //   typedef C E;
347     //
348     // gives you
349     //
350     //   A
351     //   |- B
352     //   `- C
353     //      |- D
354     //      `- E
355     //
356     // It is wrong to assume that the relation is a chain.  A correct
357     // implementation of isDerivedFrom() needs to recognize that B and
358     // E are aliases, even though neither is a typedef of the other.
359     // Therefore, we cannot simply walk through one typedef chain to
360     // find out whether the type name matches.
361     const Type *TypeNode = DeclNode->getUnderlyingType().getTypePtr();
362     const Type *CanonicalType =  // root of the typedef tree
363         ActiveASTContext->getCanonicalType(TypeNode);
364     TypeAliases[CanonicalType].insert(DeclNode);
365     return true;
366   }
367 
  // Traversal hooks for each base node type. Only declared here; their
  // definitions are not part of the class body shown above.
  bool TraverseDecl(Decl *DeclNode);
  bool TraverseStmt(Stmt *StmtNode);
  bool TraverseType(QualType TypeNode);
  bool TraverseTypeLoc(TypeLoc TypeNode);
  bool TraverseNestedNameSpecifier(NestedNameSpecifier *NNS);
  bool TraverseNestedNameSpecifierLoc(NestedNameSpecifierLoc NNS);
374 
375   // Matches children or descendants of 'Node' with 'BaseMatcher'.
memoizedMatchesRecursively(const ast_type_traits::DynTypedNode & Node,const DynTypedMatcher & Matcher,BoundNodesTreeBuilder * Builder,int MaxDepth,TraversalKind Traversal,BindKind Bind)376   bool memoizedMatchesRecursively(const ast_type_traits::DynTypedNode &Node,
377                                   const DynTypedMatcher &Matcher,
378                                   BoundNodesTreeBuilder *Builder, int MaxDepth,
379                                   TraversalKind Traversal, BindKind Bind) {
380     // For AST-nodes that don't have an identity, we can't memoize.
381     if (!Node.getMemoizationData() || !Builder->isComparable())
382       return matchesRecursively(Node, Matcher, Builder, MaxDepth, Traversal,
383                                 Bind);
384 
385     MatchKey Key;
386     Key.MatcherID = Matcher.getID();
387     Key.Node = Node;
388     // Note that we key on the bindings *before* the match.
389     Key.BoundNodes = *Builder;
390 
391     MemoizationMap::iterator I = ResultCache.find(Key);
392     if (I != ResultCache.end()) {
393       *Builder = I->second.Nodes;
394       return I->second.ResultOfMatch;
395     }
396 
397     MemoizedMatchResult Result;
398     Result.Nodes = *Builder;
399     Result.ResultOfMatch = matchesRecursively(Node, Matcher, &Result.Nodes,
400                                               MaxDepth, Traversal, Bind);
401 
402     MemoizedMatchResult &CachedResult = ResultCache[Key];
403     CachedResult = std::move(Result);
404 
405     *Builder = CachedResult.Nodes;
406     return CachedResult.ResultOfMatch;
407   }
408 
409   // Matches children or descendants of 'Node' with 'BaseMatcher'.
matchesRecursively(const ast_type_traits::DynTypedNode & Node,const DynTypedMatcher & Matcher,BoundNodesTreeBuilder * Builder,int MaxDepth,TraversalKind Traversal,BindKind Bind)410   bool matchesRecursively(const ast_type_traits::DynTypedNode &Node,
411                           const DynTypedMatcher &Matcher,
412                           BoundNodesTreeBuilder *Builder, int MaxDepth,
413                           TraversalKind Traversal, BindKind Bind) {
414     MatchChildASTVisitor Visitor(
415       &Matcher, this, Builder, MaxDepth, Traversal, Bind);
416     return Visitor.findMatch(Node);
417   }
418 
  // Overrides the ASTMatchFinder hook of the same name. Only declared here;
  // the definition is not part of the class body shown above.
  bool classIsDerivedFrom(const CXXRecordDecl *Declaration,
                          const Matcher<NamedDecl> &Base,
                          BoundNodesTreeBuilder *Builder) override;
422 
423   // Implements ASTMatchFinder::matchesChildOf.
matchesChildOf(const ast_type_traits::DynTypedNode & Node,const DynTypedMatcher & Matcher,BoundNodesTreeBuilder * Builder,TraversalKind Traversal,BindKind Bind)424   bool matchesChildOf(const ast_type_traits::DynTypedNode &Node,
425                       const DynTypedMatcher &Matcher,
426                       BoundNodesTreeBuilder *Builder,
427                       TraversalKind Traversal,
428                       BindKind Bind) override {
429     if (ResultCache.size() > MaxMemoizationEntries)
430       ResultCache.clear();
431     return memoizedMatchesRecursively(Node, Matcher, Builder, 1, Traversal,
432                                       Bind);
433   }
434   // Implements ASTMatchFinder::matchesDescendantOf.
matchesDescendantOf(const ast_type_traits::DynTypedNode & Node,const DynTypedMatcher & Matcher,BoundNodesTreeBuilder * Builder,BindKind Bind)435   bool matchesDescendantOf(const ast_type_traits::DynTypedNode &Node,
436                            const DynTypedMatcher &Matcher,
437                            BoundNodesTreeBuilder *Builder,
438                            BindKind Bind) override {
439     if (ResultCache.size() > MaxMemoizationEntries)
440       ResultCache.clear();
441     return memoizedMatchesRecursively(Node, Matcher, Builder, INT_MAX,
442                                       TK_AsIs, Bind);
443   }
444   // Implements ASTMatchFinder::matchesAncestorOf.
matchesAncestorOf(const ast_type_traits::DynTypedNode & Node,const DynTypedMatcher & Matcher,BoundNodesTreeBuilder * Builder,AncestorMatchMode MatchMode)445   bool matchesAncestorOf(const ast_type_traits::DynTypedNode &Node,
446                          const DynTypedMatcher &Matcher,
447                          BoundNodesTreeBuilder *Builder,
448                          AncestorMatchMode MatchMode) override {
449     // Reset the cache outside of the recursive call to make sure we
450     // don't invalidate any iterators.
451     if (ResultCache.size() > MaxMemoizationEntries)
452       ResultCache.clear();
453     return memoizedMatchesAncestorOfRecursively(Node, Matcher, Builder,
454                                                 MatchMode);
455   }
456 
457   // Matches all registered matchers on the given node and calls the
458   // result callback for every node that matches.
match(const ast_type_traits::DynTypedNode & Node)459   void match(const ast_type_traits::DynTypedNode &Node) {
460     // FIXME: Improve this with a switch or a visitor pattern.
461     if (auto *N = Node.get<Decl>()) {
462       match(*N);
463     } else if (auto *N = Node.get<Stmt>()) {
464       match(*N);
465     } else if (auto *N = Node.get<Type>()) {
466       match(*N);
467     } else if (auto *N = Node.get<QualType>()) {
468       match(*N);
469     } else if (auto *N = Node.get<NestedNameSpecifier>()) {
470       match(*N);
471     } else if (auto *N = Node.get<NestedNameSpecifierLoc>()) {
472       match(*N);
473     } else if (auto *N = Node.get<TypeLoc>()) {
474       match(*N);
475     }
476   }
477 
  // Typed entry point: forwards the address of 'Node' to matchDispatch(),
  // whose overloads pick the matchers registered for that node type. Types
  // without a dedicated overload end up in the do-nothing
  // matchDispatch(const void *).
  template <typename T> void match(const T &Node) {
    matchDispatch(&Node);
  }
481 
  // Implements ASTMatchFinder::getASTContext.
  // Dereferences the active context, so a context must have been installed
  // via set_active_ast_context() before this is called.
  ASTContext &getASTContext() const override { return *ActiveASTContext; }
484 
  // RecursiveASTVisitor configuration hooks: both template instantiations
  // and implicit code are included in the traversal.
  bool shouldVisitTemplateInstantiations() const { return true; }
  bool shouldVisitImplicitCode() const { return true; }
487 
488 private:
489   class TimeBucketRegion {
490   public:
TimeBucketRegion()491     TimeBucketRegion() : Bucket(nullptr) {}
~TimeBucketRegion()492     ~TimeBucketRegion() { setBucket(nullptr); }
493 
494     /// \brief Start timing for \p NewBucket.
495     ///
496     /// If there was a bucket already set, it will finish the timing for that
497     /// other bucket.
498     /// \p NewBucket will be timed until the next call to \c setBucket() or
499     /// until the \c TimeBucketRegion is destroyed.
500     /// If \p NewBucket is the same as the currently timed bucket, this call
501     /// does nothing.
setBucket(llvm::TimeRecord * NewBucket)502     void setBucket(llvm::TimeRecord *NewBucket) {
503       if (Bucket != NewBucket) {
504         auto Now = llvm::TimeRecord::getCurrentTime(true);
505         if (Bucket)
506           *Bucket += Now;
507         if (NewBucket)
508           *NewBucket -= Now;
509         Bucket = NewBucket;
510       }
511     }
512 
513   private:
514     llvm::TimeRecord *Bucket;
515   };
516 
517   /// \brief Runs all the \p Matchers on \p Node.
518   ///
519   /// Used by \c matchDispatch() below.
520   template <typename T, typename MC>
matchWithoutFilter(const T & Node,const MC & Matchers)521   void matchWithoutFilter(const T &Node, const MC &Matchers) {
522     const bool EnableCheckProfiling = Options.CheckProfiling.hasValue();
523     TimeBucketRegion Timer;
524     for (const auto &MP : Matchers) {
525       if (EnableCheckProfiling)
526         Timer.setBucket(&TimeByBucket[MP.second->getID()]);
527       BoundNodesTreeBuilder Builder;
528       if (MP.first.matches(Node, this, &Builder)) {
529         MatchVisitor Visitor(ActiveASTContext, MP.second);
530         Builder.visitMatches(&Visitor);
531       }
532     }
533   }
534 
matchWithFilter(const ast_type_traits::DynTypedNode & DynNode)535   void matchWithFilter(const ast_type_traits::DynTypedNode &DynNode) {
536     auto Kind = DynNode.getNodeKind();
537     auto it = MatcherFiltersMap.find(Kind);
538     const auto &Filter =
539         it != MatcherFiltersMap.end() ? it->second : getFilterForKind(Kind);
540 
541     if (Filter.empty())
542       return;
543 
544     const bool EnableCheckProfiling = Options.CheckProfiling.hasValue();
545     TimeBucketRegion Timer;
546     auto &Matchers = this->Matchers->DeclOrStmt;
547     for (unsigned short I : Filter) {
548       auto &MP = Matchers[I];
549       if (EnableCheckProfiling)
550         Timer.setBucket(&TimeByBucket[MP.second->getID()]);
551       BoundNodesTreeBuilder Builder;
552       if (MP.first.matchesNoKindCheck(DynNode, this, &Builder)) {
553         MatchVisitor Visitor(ActiveASTContext, MP.second);
554         Builder.visitMatches(&Visitor);
555       }
556     }
557   }
558 
559   const std::vector<unsigned short> &
getFilterForKind(ast_type_traits::ASTNodeKind Kind)560   getFilterForKind(ast_type_traits::ASTNodeKind Kind) {
561     auto &Filter = MatcherFiltersMap[Kind];
562     auto &Matchers = this->Matchers->DeclOrStmt;
563     assert((Matchers.size() < USHRT_MAX) && "Too many matchers.");
564     for (unsigned I = 0, E = Matchers.size(); I != E; ++I) {
565       if (Matchers[I].first.canMatchNodesOfKind(Kind)) {
566         Filter.push_back(I);
567       }
568     }
569     return Filter;
570   }
571 
572   /// @{
573   /// \brief Overloads to pair the different node types to their matchers.
matchDispatch(const Decl * Node)574   void matchDispatch(const Decl *Node) {
575     return matchWithFilter(ast_type_traits::DynTypedNode::create(*Node));
576   }
matchDispatch(const Stmt * Node)577   void matchDispatch(const Stmt *Node) {
578     return matchWithFilter(ast_type_traits::DynTypedNode::create(*Node));
579   }
580 
matchDispatch(const Type * Node)581   void matchDispatch(const Type *Node) {
582     matchWithoutFilter(QualType(Node, 0), Matchers->Type);
583   }
matchDispatch(const TypeLoc * Node)584   void matchDispatch(const TypeLoc *Node) {
585     matchWithoutFilter(*Node, Matchers->TypeLoc);
586   }
matchDispatch(const QualType * Node)587   void matchDispatch(const QualType *Node) {
588     matchWithoutFilter(*Node, Matchers->Type);
589   }
matchDispatch(const NestedNameSpecifier * Node)590   void matchDispatch(const NestedNameSpecifier *Node) {
591     matchWithoutFilter(*Node, Matchers->NestedNameSpecifier);
592   }
matchDispatch(const NestedNameSpecifierLoc * Node)593   void matchDispatch(const NestedNameSpecifierLoc *Node) {
594     matchWithoutFilter(*Node, Matchers->NestedNameSpecifierLoc);
595   }
matchDispatch(const void *)596   void matchDispatch(const void *) { /* Do nothing. */ }
597   /// @}
598 
599   // Returns whether an ancestor of \p Node matches \p Matcher.
600   //
601   // The order of matching ((which can lead to different nodes being bound in
602   // case there are multiple matches) is breadth first search.
603   //
604   // To allow memoization in the very common case of having deeply nested
605   // expressions inside a template function, we first walk up the AST, memoizing
606   // the result of the match along the way, as long as there is only a single
607   // parent.
608   //
609   // Once there are multiple parents, the breadth first search order does not
610   // allow simple memoization on the ancestors. Thus, we only memoize as long
611   // as there is a single parent.
memoizedMatchesAncestorOfRecursively(const ast_type_traits::DynTypedNode & Node,const DynTypedMatcher & Matcher,BoundNodesTreeBuilder * Builder,AncestorMatchMode MatchMode)612   bool memoizedMatchesAncestorOfRecursively(
613       const ast_type_traits::DynTypedNode &Node, const DynTypedMatcher &Matcher,
614       BoundNodesTreeBuilder *Builder, AncestorMatchMode MatchMode) {
615     if (Node.get<TranslationUnitDecl>() ==
616         ActiveASTContext->getTranslationUnitDecl())
617       return false;
618 
619     // For AST-nodes that don't have an identity, we can't memoize.
620     if (!Builder->isComparable())
621       return matchesAncestorOfRecursively(Node, Matcher, Builder, MatchMode);
622 
623     MatchKey Key;
624     Key.MatcherID = Matcher.getID();
625     Key.Node = Node;
626     Key.BoundNodes = *Builder;
627 
628     // Note that we cannot use insert and reuse the iterator, as recursive
629     // calls to match might invalidate the result cache iterators.
630     MemoizationMap::iterator I = ResultCache.find(Key);
631     if (I != ResultCache.end()) {
632       *Builder = I->second.Nodes;
633       return I->second.ResultOfMatch;
634     }
635 
636     MemoizedMatchResult Result;
637     Result.Nodes = *Builder;
638     Result.ResultOfMatch =
639         matchesAncestorOfRecursively(Node, Matcher, &Result.Nodes, MatchMode);
640 
641     MemoizedMatchResult &CachedResult = ResultCache[Key];
642     CachedResult = std::move(Result);
643 
644     *Builder = CachedResult.Nodes;
645     return CachedResult.ResultOfMatch;
646   }
647 
matchesAncestorOfRecursively(const ast_type_traits::DynTypedNode & Node,const DynTypedMatcher & Matcher,BoundNodesTreeBuilder * Builder,AncestorMatchMode MatchMode)648   bool matchesAncestorOfRecursively(const ast_type_traits::DynTypedNode &Node,
649                                     const DynTypedMatcher &Matcher,
650                                     BoundNodesTreeBuilder *Builder,
651                                     AncestorMatchMode MatchMode) {
652     const auto &Parents = ActiveASTContext->getParents(Node);
653     assert(!Parents.empty() && "Found node that is not in the parent map.");
654     if (Parents.size() == 1) {
655       // Only one parent - do recursive memoization.
656       const ast_type_traits::DynTypedNode Parent = Parents[0];
657       BoundNodesTreeBuilder BuilderCopy = *Builder;
658       if (Matcher.matches(Parent, this, &BuilderCopy)) {
659         *Builder = std::move(BuilderCopy);
660         return true;
661       }
662       if (MatchMode != ASTMatchFinder::AMM_ParentOnly) {
663         return memoizedMatchesAncestorOfRecursively(Parent, Matcher, Builder,
664                                                     MatchMode);
665         // Once we get back from the recursive call, the result will be the
666         // same as the parent's result.
667       }
668     } else {
669       // Multiple parents - BFS over the rest of the nodes.
670       llvm::DenseSet<const void *> Visited;
671       std::deque<ast_type_traits::DynTypedNode> Queue(Parents.begin(),
672                                                       Parents.end());
673       while (!Queue.empty()) {
674         BoundNodesTreeBuilder BuilderCopy = *Builder;
675         if (Matcher.matches(Queue.front(), this, &BuilderCopy)) {
676           *Builder = std::move(BuilderCopy);
677           return true;
678         }
679         if (MatchMode != ASTMatchFinder::AMM_ParentOnly) {
680           for (const auto &Parent :
681                ActiveASTContext->getParents(Queue.front())) {
682             // Make sure we do not visit the same node twice.
683             // Otherwise, we'll visit the common ancestors as often as there
684             // are splits on the way down.
685             if (Visited.insert(Parent.getMemoizationData()).second)
686               Queue.push_back(Parent);
687           }
688         }
689         Queue.pop_front();
690       }
691     }
692     return false;
693   }
694 
695   // Implements a BoundNodesTree::Visitor that calls a MatchCallback with
696   // the aggregated bound nodes for each match.
697   class MatchVisitor : public BoundNodesTreeBuilder::Visitor {
698   public:
MatchVisitor(ASTContext * Context,MatchFinder::MatchCallback * Callback)699     MatchVisitor(ASTContext* Context,
700                  MatchFinder::MatchCallback* Callback)
701       : Context(Context),
702         Callback(Callback) {}
703 
visitMatch(const BoundNodes & BoundNodesView)704     void visitMatch(const BoundNodes& BoundNodesView) override {
705       Callback->run(MatchFinder::MatchResult(BoundNodesView, Context));
706     }
707 
708   private:
709     ASTContext* Context;
710     MatchFinder::MatchCallback* Callback;
711   };
712 
713   // Returns true if 'TypeNode' has an alias that matches the given matcher.
typeHasMatchingAlias(const Type * TypeNode,const Matcher<NamedDecl> & Matcher,BoundNodesTreeBuilder * Builder)714   bool typeHasMatchingAlias(const Type *TypeNode,
715                             const Matcher<NamedDecl> &Matcher,
716                             BoundNodesTreeBuilder *Builder) {
717     const Type *const CanonicalType =
718       ActiveASTContext->getCanonicalType(TypeNode);
719     for (const TypedefNameDecl *Alias : TypeAliases.lookup(CanonicalType)) {
720       BoundNodesTreeBuilder Result(*Builder);
721       if (Matcher.matches(*Alias, this, &Result)) {
722         *Builder = std::move(Result);
723         return true;
724       }
725     }
726     return false;
727   }
728 
  /// \brief Bucket to record map.
  ///
  /// Maps a bucket name to the \c llvm::TimeRecord kept for that bucket.
  /// Used to get the appropriate bucket for each matcher.
  llvm::StringMap<llvm::TimeRecord> TimeByBucket;

  /// \brief The matcher lists (by type) this visitor works with.
  ///
  /// NOTE(review): presumably the pointer handed to the constructor; callers
  /// such as \c MatchFinder::matchAST() pass the address of the finder's own
  /// matcher lists -- confirm against the constructor.
  const MatchFinder::MatchersByType *Matchers;

  /// \brief Filtered list of matcher indices for each node kind.
  ///
  /// \c Decl and \c Stmt toplevel matchers usually apply to a specific node
  /// kind (and derived kinds) so it is a waste to try every matcher on every
  /// node.
  /// We precalculate a list of matchers that pass the toplevel restrict check.
  /// This also allows us to skip the restrict check at matching time. See the
  /// use of \c matchesNoKindCheck() above.
  llvm::DenseMap<ast_type_traits::ASTNodeKind, std::vector<unsigned short>>
      MatcherFiltersMap;

  /// \brief Finder options.  Held by reference, so the referenced object has
  /// to outlive this visitor.
  const MatchFinder::MatchFinderOptions &Options;

  /// \brief The ASTContext used for AST queries such as \c getParents() and
  /// \c getCanonicalType().
  ASTContext *ActiveASTContext;

  // Maps a canonical type to the TypedefNameDecls recorded for it; consulted
  // by typeHasMatchingAlias().
  llvm::DenseMap<const Type*, std::set<const TypedefNameDecl*> > TypeAliases;

  // Maps (matcher, node) -> the match result for memoization.
  typedef std::map<MatchKey, MemoizedMatchResult> MemoizationMap;
  MemoizationMap ResultCache;
756 };
757 
758 static CXXRecordDecl *
getAsCXXRecordDeclOrPrimaryTemplate(const Type * TypeNode)759 getAsCXXRecordDeclOrPrimaryTemplate(const Type *TypeNode) {
760   if (auto *RD = TypeNode->getAsCXXRecordDecl())
761     return RD;
762 
763   // Find the innermost TemplateSpecializationType that isn't an alias template.
764   auto *TemplateType = TypeNode->getAs<TemplateSpecializationType>();
765   while (TemplateType && TemplateType->isTypeAlias())
766     TemplateType =
767         TemplateType->getAliasedType()->getAs<TemplateSpecializationType>();
768 
769   // If this is the name of a (dependent) template specialization, use the
770   // definition of the template, even though it might be specialized later.
771   if (TemplateType)
772     if (auto *ClassTemplate = dyn_cast_or_null<ClassTemplateDecl>(
773           TemplateType->getTemplateName().getAsTemplateDecl()))
774       return ClassTemplate->getTemplatedDecl();
775 
776   return nullptr;
777 }
778 
779 // Returns true if the given class is directly or indirectly derived
780 // from a base type with the given name.  A class is not considered to be
781 // derived from itself.
classIsDerivedFrom(const CXXRecordDecl * Declaration,const Matcher<NamedDecl> & Base,BoundNodesTreeBuilder * Builder)782 bool MatchASTVisitor::classIsDerivedFrom(const CXXRecordDecl *Declaration,
783                                          const Matcher<NamedDecl> &Base,
784                                          BoundNodesTreeBuilder *Builder) {
785   if (!Declaration->hasDefinition())
786     return false;
787   for (const auto &It : Declaration->bases()) {
788     const Type *TypeNode = It.getType().getTypePtr();
789 
790     if (typeHasMatchingAlias(TypeNode, Base, Builder))
791       return true;
792 
793     // FIXME: Going to the primary template here isn't really correct, but
794     // unfortunately we accept a Decl matcher for the base class not a Type
795     // matcher, so it's the best thing we can do with our current interface.
796     CXXRecordDecl *ClassDecl = getAsCXXRecordDeclOrPrimaryTemplate(TypeNode);
797     if (!ClassDecl)
798       continue;
799     if (ClassDecl == Declaration) {
800       // This can happen for recursive template definitions; if the
801       // current declaration did not match, we can safely return false.
802       return false;
803     }
804     BoundNodesTreeBuilder Result(*Builder);
805     if (Base.matches(*ClassDecl, this, &Result)) {
806       *Builder = std::move(Result);
807       return true;
808     }
809     if (classIsDerivedFrom(ClassDecl, Base, Builder))
810       return true;
811   }
812   return false;
813 }
814 
TraverseDecl(Decl * DeclNode)815 bool MatchASTVisitor::TraverseDecl(Decl *DeclNode) {
816   if (!DeclNode) {
817     return true;
818   }
819   match(*DeclNode);
820   return RecursiveASTVisitor<MatchASTVisitor>::TraverseDecl(DeclNode);
821 }
822 
TraverseStmt(Stmt * StmtNode)823 bool MatchASTVisitor::TraverseStmt(Stmt *StmtNode) {
824   if (!StmtNode) {
825     return true;
826   }
827   match(*StmtNode);
828   return RecursiveASTVisitor<MatchASTVisitor>::TraverseStmt(StmtNode);
829 }
830 
TraverseType(QualType TypeNode)831 bool MatchASTVisitor::TraverseType(QualType TypeNode) {
832   match(TypeNode);
833   return RecursiveASTVisitor<MatchASTVisitor>::TraverseType(TypeNode);
834 }
835 
TraverseTypeLoc(TypeLoc TypeLocNode)836 bool MatchASTVisitor::TraverseTypeLoc(TypeLoc TypeLocNode) {
837   // The RecursiveASTVisitor only visits types if they're not within TypeLocs.
838   // We still want to find those types via matchers, so we match them here. Note
839   // that the TypeLocs are structurally a shadow-hierarchy to the expressed
840   // type, so we visit all involved parts of a compound type when matching on
841   // each TypeLoc.
842   match(TypeLocNode);
843   match(TypeLocNode.getType());
844   return RecursiveASTVisitor<MatchASTVisitor>::TraverseTypeLoc(TypeLocNode);
845 }
846 
TraverseNestedNameSpecifier(NestedNameSpecifier * NNS)847 bool MatchASTVisitor::TraverseNestedNameSpecifier(NestedNameSpecifier *NNS) {
848   match(*NNS);
849   return RecursiveASTVisitor<MatchASTVisitor>::TraverseNestedNameSpecifier(NNS);
850 }
851 
TraverseNestedNameSpecifierLoc(NestedNameSpecifierLoc NNS)852 bool MatchASTVisitor::TraverseNestedNameSpecifierLoc(
853     NestedNameSpecifierLoc NNS) {
854   if (!NNS)
855     return true;
856 
857   match(NNS);
858 
859   // We only match the nested name specifier here (as opposed to traversing it)
860   // because the traversal is already done in the parallel "Loc"-hierarchy.
861   if (NNS.hasQualifier())
862     match(*NNS.getNestedNameSpecifier());
863   return
864       RecursiveASTVisitor<MatchASTVisitor>::TraverseNestedNameSpecifierLoc(NNS);
865 }
866 
867 class MatchASTConsumer : public ASTConsumer {
868 public:
MatchASTConsumer(MatchFinder * Finder,MatchFinder::ParsingDoneTestCallback * ParsingDone)869   MatchASTConsumer(MatchFinder *Finder,
870                    MatchFinder::ParsingDoneTestCallback *ParsingDone)
871       : Finder(Finder), ParsingDone(ParsingDone) {}
872 
873 private:
HandleTranslationUnit(ASTContext & Context)874   void HandleTranslationUnit(ASTContext &Context) override {
875     if (ParsingDone != nullptr) {
876       ParsingDone->run();
877     }
878     Finder->matchAST(Context);
879   }
880 
881   MatchFinder *Finder;
882   MatchFinder::ParsingDoneTestCallback *ParsingDone;
883 };
884 
885 } // end namespace
886 } // end namespace internal
887 
MatchResult(const BoundNodes & Nodes,ASTContext * Context)888 MatchFinder::MatchResult::MatchResult(const BoundNodes &Nodes,
889                                       ASTContext *Context)
890   : Nodes(Nodes), Context(Context),
891     SourceManager(&Context->getSourceManager()) {}
892 
~MatchCallback()893 MatchFinder::MatchCallback::~MatchCallback() {}
~ParsingDoneTestCallback()894 MatchFinder::ParsingDoneTestCallback::~ParsingDoneTestCallback() {}
895 
MatchFinder(MatchFinderOptions Options)896 MatchFinder::MatchFinder(MatchFinderOptions Options)
897     : Options(std::move(Options)), ParsingDone(nullptr) {}
898 
~MatchFinder()899 MatchFinder::~MatchFinder() {}
900 
addMatcher(const DeclarationMatcher & NodeMatch,MatchCallback * Action)901 void MatchFinder::addMatcher(const DeclarationMatcher &NodeMatch,
902                              MatchCallback *Action) {
903   Matchers.DeclOrStmt.emplace_back(NodeMatch, Action);
904   Matchers.AllCallbacks.insert(Action);
905 }
906 
addMatcher(const TypeMatcher & NodeMatch,MatchCallback * Action)907 void MatchFinder::addMatcher(const TypeMatcher &NodeMatch,
908                              MatchCallback *Action) {
909   Matchers.Type.emplace_back(NodeMatch, Action);
910   Matchers.AllCallbacks.insert(Action);
911 }
912 
addMatcher(const StatementMatcher & NodeMatch,MatchCallback * Action)913 void MatchFinder::addMatcher(const StatementMatcher &NodeMatch,
914                              MatchCallback *Action) {
915   Matchers.DeclOrStmt.emplace_back(NodeMatch, Action);
916   Matchers.AllCallbacks.insert(Action);
917 }
918 
addMatcher(const NestedNameSpecifierMatcher & NodeMatch,MatchCallback * Action)919 void MatchFinder::addMatcher(const NestedNameSpecifierMatcher &NodeMatch,
920                              MatchCallback *Action) {
921   Matchers.NestedNameSpecifier.emplace_back(NodeMatch, Action);
922   Matchers.AllCallbacks.insert(Action);
923 }
924 
addMatcher(const NestedNameSpecifierLocMatcher & NodeMatch,MatchCallback * Action)925 void MatchFinder::addMatcher(const NestedNameSpecifierLocMatcher &NodeMatch,
926                              MatchCallback *Action) {
927   Matchers.NestedNameSpecifierLoc.emplace_back(NodeMatch, Action);
928   Matchers.AllCallbacks.insert(Action);
929 }
930 
addMatcher(const TypeLocMatcher & NodeMatch,MatchCallback * Action)931 void MatchFinder::addMatcher(const TypeLocMatcher &NodeMatch,
932                              MatchCallback *Action) {
933   Matchers.TypeLoc.emplace_back(NodeMatch, Action);
934   Matchers.AllCallbacks.insert(Action);
935 }
936 
addDynamicMatcher(const internal::DynTypedMatcher & NodeMatch,MatchCallback * Action)937 bool MatchFinder::addDynamicMatcher(const internal::DynTypedMatcher &NodeMatch,
938                                     MatchCallback *Action) {
939   if (NodeMatch.canConvertTo<Decl>()) {
940     addMatcher(NodeMatch.convertTo<Decl>(), Action);
941     return true;
942   } else if (NodeMatch.canConvertTo<QualType>()) {
943     addMatcher(NodeMatch.convertTo<QualType>(), Action);
944     return true;
945   } else if (NodeMatch.canConvertTo<Stmt>()) {
946     addMatcher(NodeMatch.convertTo<Stmt>(), Action);
947     return true;
948   } else if (NodeMatch.canConvertTo<NestedNameSpecifier>()) {
949     addMatcher(NodeMatch.convertTo<NestedNameSpecifier>(), Action);
950     return true;
951   } else if (NodeMatch.canConvertTo<NestedNameSpecifierLoc>()) {
952     addMatcher(NodeMatch.convertTo<NestedNameSpecifierLoc>(), Action);
953     return true;
954   } else if (NodeMatch.canConvertTo<TypeLoc>()) {
955     addMatcher(NodeMatch.convertTo<TypeLoc>(), Action);
956     return true;
957   }
958   return false;
959 }
960 
newASTConsumer()961 std::unique_ptr<ASTConsumer> MatchFinder::newASTConsumer() {
962   return llvm::make_unique<internal::MatchASTConsumer>(this, ParsingDone);
963 }
964 
match(const clang::ast_type_traits::DynTypedNode & Node,ASTContext & Context)965 void MatchFinder::match(const clang::ast_type_traits::DynTypedNode &Node,
966                         ASTContext &Context) {
967   internal::MatchASTVisitor Visitor(&Matchers, Options);
968   Visitor.set_active_ast_context(&Context);
969   Visitor.match(Node);
970 }
971 
matchAST(ASTContext & Context)972 void MatchFinder::matchAST(ASTContext &Context) {
973   internal::MatchASTVisitor Visitor(&Matchers, Options);
974   Visitor.set_active_ast_context(&Context);
975   Visitor.onStartOfTranslationUnit();
976   Visitor.TraverseDecl(Context.getTranslationUnitDecl());
977   Visitor.onEndOfTranslationUnit();
978 }
979 
registerTestCallbackAfterParsing(MatchFinder::ParsingDoneTestCallback * NewParsingDone)980 void MatchFinder::registerTestCallbackAfterParsing(
981     MatchFinder::ParsingDoneTestCallback *NewParsingDone) {
982   ParsingDone = NewParsingDone;
983 }
984 
getID() const985 StringRef MatchFinder::MatchCallback::getID() const { return "<unknown>"; }
986 
987 } // end namespace ast_matchers
988 } // end namespace clang
989