1 //===--- FunctionCognitiveComplexityCheck.cpp - clang-tidy ------*- C++ -*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 
9 #include "FunctionCognitiveComplexityCheck.h"
10 #include "../ClangTidyDiagnosticConsumer.h"
11 #include "clang/AST/Decl.h"
12 #include "clang/AST/DeclBase.h"
13 #include "clang/AST/Expr.h"
14 #include "clang/AST/RecursiveASTVisitor.h"
15 #include "clang/AST/Stmt.h"
16 #include "clang/ASTMatchers/ASTMatchFinder.h"
17 #include "clang/ASTMatchers/ASTMatchers.h"
18 #include "clang/ASTMatchers/ASTMatchersInternal.h"
19 #include "clang/Basic/Diagnostic.h"
20 #include "clang/Basic/DiagnosticIDs.h"
21 #include "clang/Basic/LLVM.h"
22 #include "clang/Basic/SourceLocation.h"
23 #include "llvm/ADT/Optional.h"
24 #include "llvm/ADT/SmallVector.h"
25 #include "llvm/Support/Casting.h"
26 #include "llvm/Support/ErrorHandling.h"
27 #include <array>
28 #include <cassert>
29 #include <stack>
30 #include <tuple>
31 #include <type_traits>
32 #include <utility>
33 
34 using namespace clang::ast_matchers;
35 
36 namespace clang {
37 namespace tidy {
38 namespace readability {
39 namespace {
40 
41 struct CognitiveComplexity final {
42   // Any increment is based on some combination of reasons.
43   // For details you can look at the Specification at
44   // https://www.sonarsource.com/docs/CognitiveComplexity.pdf
45   // or user-facing docs at
46   // http://clang.llvm.org/extra/clang-tidy/checks/readability-function-cognitive-complexity.html
47   // Here are all the possible reasons:
48   enum Criteria : uint8_t {
49     None = 0U,
50 
51     // B1, increases cognitive complexity (by 1)
52     // What causes it:
53     // * if, else if, else, ConditionalOperator (not BinaryConditionalOperator)
54     // * SwitchStmt
55     // * ForStmt, CXXForRangeStmt
56     // * WhileStmt, DoStmt
57     // * CXXCatchStmt
58     // * GotoStmt, IndirectGotoStmt (but not BreakStmt, ContinueStmt)
59     // * sequences of binary logical operators (BinOpLAnd, BinOpLOr)
60     // * each method in a recursion cycle (not implemented)
61     Increment = 1U << 0,
62 
63     // B2, increases current nesting level (by 1)
64     // What causes it:
65     // * if, else if, else, ConditionalOperator (not BinaryConditionalOperator)
66     // * SwitchStmt
67     // * ForStmt, CXXForRangeStmt
68     // * WhileStmt, DoStmt
69     // * CXXCatchStmt
70     // * nested CXXConstructor, CXXDestructor, CXXMethod (incl. C++11 Lambda)
71     // * GNU Statement Expression
72     // * Apple Block declaration
73     IncrementNesting = 1U << 1,
74 
75     // B3, increases cognitive complexity by the current nesting level
76     // Applied before IncrementNesting
77     // What causes it:
78     // * IfStmt, ConditionalOperator (not BinaryConditionalOperator)
79     // * SwitchStmt
80     // * ForStmt, CXXForRangeStmt
81     // * WhileStmt, DoStmt
82     // * CXXCatchStmt
83     PenalizeNesting = 1U << 2,
84 
85     All = Increment | PenalizeNesting | IncrementNesting,
86   };
87 
88   // The helper struct used to record one increment occurrence, with all the
89   // details nessesary.
90   struct Detail {
91     const SourceLocation Loc;     // What caused the increment?
92     const unsigned short Nesting; // How deeply nested is Loc located?
93     const Criteria C;             // The criteria of the increment
94 
Detailclang::tidy::readability::__anon7c293f010111::CognitiveComplexity::Detail95     Detail(SourceLocation SLoc, unsigned short CurrentNesting, Criteria Crit)
96         : Loc(SLoc), Nesting(CurrentNesting), C(Crit) {}
97 
98     // To minimize the sizeof(Detail), we only store the minimal info there.
99     // This function is used to convert from the stored info into the usable
100     // information - what message to output, how much of an increment did this
101     // occurrence actually result in.
processclang::tidy::readability::__anon7c293f010111::CognitiveComplexity::Detail102     std::pair<unsigned, unsigned short> process() const {
103       assert(C != Criteria::None && "invalid criteria");
104 
105       unsigned MsgId;           // The id of the message to output.
106       unsigned short Increment; // How much of an increment?
107 
108       if (C == Criteria::All) {
109         Increment = 1 + Nesting;
110         MsgId = 0;
111       } else if (C == (Criteria::Increment | Criteria::IncrementNesting)) {
112         Increment = 1;
113         MsgId = 1;
114       } else if (C == Criteria::Increment) {
115         Increment = 1;
116         MsgId = 2;
117       } else if (C == Criteria::IncrementNesting) {
118         Increment = 0; // Unused in this message.
119         MsgId = 3;
120       } else
121         llvm_unreachable("should not get to here.");
122 
123       return std::make_pair(MsgId, Increment);
124     }
125   };
126 
127   // Limit of 25 is the "upstream"'s default.
128   static constexpr unsigned DefaultLimit = 25U;
129 
130   // Based on the publicly-avaliable numbers for some big open-source projects
131   // https://sonarcloud.io/projects?languages=c%2Ccpp&size=5   we can estimate:
132   // value ~20 would result in no allocs for 98% of functions, ~12 for 96%, ~10
133   // for 91%, ~8 for 88%, ~6 for 84%, ~4 for 77%, ~2 for 64%, and ~1 for 37%.
134   static_assert(sizeof(Detail) <= 8,
135                 "Since we use SmallVector to minimize the amount of "
136                 "allocations, we also need to consider the price we pay for "
137                 "that in terms of stack usage. "
138                 "Thus, it is good to minimize the size of the Detail struct.");
139   SmallVector<Detail, DefaultLimit> Details; // 25 elements is 200 bytes.
140   // Yes, 25 is a magic number. This is the seemingly-sane default for the
141   // upper limit for function cognitive complexity. Thus it would make sense
142   // to avoid allocations for any function that does not violate the limit.
143 
144   // The grand total Cognitive Complexity of the function.
145   unsigned Total = 0;
146 
147   // The function used to store new increment, calculate the total complexity.
148   void account(SourceLocation Loc, unsigned short Nesting, Criteria C);
149 };
150 
151 // All the possible messages that can be output. The choice of the message
152 // to use is based of the combination of the CognitiveComplexity::Criteria.
153 // It would be nice to have it in CognitiveComplexity struct, but then it is
154 // not static.
155 static const std::array<const StringRef, 4> Msgs = {{
156     // B1 + B2 + B3
157     "+%0, including nesting penalty of %1, nesting level increased to %2",
158 
159     // B1 + B2
160     "+%0, nesting level increased to %2",
161 
162     // B1
163     "+%0",
164 
165     // B2
166     "nesting level increased to %2",
167 }};
168 
169 // Criteria is a bitset, thus a few helpers are needed.
operator |(CognitiveComplexity::Criteria LHS,CognitiveComplexity::Criteria RHS)170 CognitiveComplexity::Criteria operator|(CognitiveComplexity::Criteria LHS,
171                                         CognitiveComplexity::Criteria RHS) {
172   return static_cast<CognitiveComplexity::Criteria>(
173       static_cast<std::underlying_type<CognitiveComplexity::Criteria>::type>(
174           LHS) |
175       static_cast<std::underlying_type<CognitiveComplexity::Criteria>::type>(
176           RHS));
177 }
operator &(CognitiveComplexity::Criteria LHS,CognitiveComplexity::Criteria RHS)178 CognitiveComplexity::Criteria operator&(CognitiveComplexity::Criteria LHS,
179                                         CognitiveComplexity::Criteria RHS) {
180   return static_cast<CognitiveComplexity::Criteria>(
181       static_cast<std::underlying_type<CognitiveComplexity::Criteria>::type>(
182           LHS) &
183       static_cast<std::underlying_type<CognitiveComplexity::Criteria>::type>(
184           RHS));
185 }
operator |=(CognitiveComplexity::Criteria & LHS,CognitiveComplexity::Criteria RHS)186 CognitiveComplexity::Criteria &operator|=(CognitiveComplexity::Criteria &LHS,
187                                           CognitiveComplexity::Criteria RHS) {
188   LHS = operator|(LHS, RHS);
189   return LHS;
190 }
operator &=(CognitiveComplexity::Criteria & LHS,CognitiveComplexity::Criteria RHS)191 CognitiveComplexity::Criteria &operator&=(CognitiveComplexity::Criteria &LHS,
192                                           CognitiveComplexity::Criteria RHS) {
193   LHS = operator&(LHS, RHS);
194   return LHS;
195 }
196 
account(SourceLocation Loc,unsigned short Nesting,Criteria C)197 void CognitiveComplexity::account(SourceLocation Loc, unsigned short Nesting,
198                                   Criteria C) {
199   C &= Criteria::All;
200   assert(C != Criteria::None && "invalid criteria");
201 
202   Details.emplace_back(Loc, Nesting, C);
203   const Detail &D = Details.back();
204 
205   unsigned MsgId;
206   unsigned short Increase;
207   std::tie(MsgId, Increase) = D.process();
208 
209   Total += Increase;
210 }
211 
212 class FunctionASTVisitor final
213     : public RecursiveASTVisitor<FunctionASTVisitor> {
214   using Base = RecursiveASTVisitor<FunctionASTVisitor>;
215 
216   // The current nesting level (increased by Criteria::IncrementNesting).
217   unsigned short CurrentNestingLevel = 0;
218 
219   // Used to efficiently know the last type of the binary sequence operator
220   // that was encountered. It would make sense for the function call to start
221   // the new sequence, thus it is a stack.
222   using OBO = Optional<BinaryOperator::Opcode>;
223   std::stack<OBO, SmallVector<OBO, 4>> BinaryOperatorsStack;
224 
225 public:
TraverseStmtWithIncreasedNestingLevel(Stmt * Node)226   bool TraverseStmtWithIncreasedNestingLevel(Stmt *Node) {
227     ++CurrentNestingLevel;
228     bool ShouldContinue = Base::TraverseStmt(Node);
229     --CurrentNestingLevel;
230     return ShouldContinue;
231   }
232 
TraverseDeclWithIncreasedNestingLevel(Decl * Node)233   bool TraverseDeclWithIncreasedNestingLevel(Decl *Node) {
234     ++CurrentNestingLevel;
235     bool ShouldContinue = Base::TraverseDecl(Node);
236     --CurrentNestingLevel;
237     return ShouldContinue;
238   }
239 
TraverseIfStmt(IfStmt * Node,bool InElseIf=false)240   bool TraverseIfStmt(IfStmt *Node, bool InElseIf = false) {
241     if (!Node)
242       return Base::TraverseIfStmt(Node);
243 
244     {
245       CognitiveComplexity::Criteria Reasons;
246 
247       Reasons = CognitiveComplexity::Criteria::None;
248 
249       // "If" increases cognitive complexity.
250       Reasons |= CognitiveComplexity::Criteria::Increment;
251       // "If" increases nesting level.
252       Reasons |= CognitiveComplexity::Criteria::IncrementNesting;
253 
254       if (!InElseIf) {
255         // "If" receives a nesting increment commensurate with it's nested
256         // depth, if it is not part of "else if".
257         Reasons |= CognitiveComplexity::Criteria::PenalizeNesting;
258       }
259 
260       CC.account(Node->getIfLoc(), CurrentNestingLevel, Reasons);
261     }
262 
263     // If this IfStmt is *NOT* "else if", then only the body (i.e. "Then" and
264     // "Else") is traversed with increased Nesting level.
265     // However if this IfStmt *IS* "else if", then Nesting level is increased
266     // for the whole IfStmt (i.e. for "Init", "Cond", "Then" and "Else").
267 
268     if (!InElseIf) {
269       if (!TraverseStmt(Node->getInit()))
270         return false;
271 
272       if (!TraverseStmt(Node->getCond()))
273         return false;
274     } else {
275       if (!TraverseStmtWithIncreasedNestingLevel(Node->getInit()))
276         return false;
277 
278       if (!TraverseStmtWithIncreasedNestingLevel(Node->getCond()))
279         return false;
280     }
281 
282     // "Then" always increases nesting level.
283     if (!TraverseStmtWithIncreasedNestingLevel(Node->getThen()))
284       return false;
285 
286     if (!Node->getElse())
287       return true;
288 
289     if (auto *E = dyn_cast<IfStmt>(Node->getElse()))
290       return TraverseIfStmt(E, true);
291 
292     {
293       CognitiveComplexity::Criteria Reasons;
294 
295       Reasons = CognitiveComplexity::Criteria::None;
296 
297       // "Else" increases cognitive complexity.
298       Reasons |= CognitiveComplexity::Criteria::Increment;
299       // "Else" increases nesting level.
300       Reasons |= CognitiveComplexity::Criteria::IncrementNesting;
301       // "Else" DOES NOT receive a nesting increment commensurate with it's
302       // nested depth.
303 
304       CC.account(Node->getElseLoc(), CurrentNestingLevel, Reasons);
305     }
306 
307     // "Else" always increases nesting level.
308     return TraverseStmtWithIncreasedNestingLevel(Node->getElse());
309   }
310 
311 // The currently-being-processed stack entry, which is always the top.
312 #define CurrentBinaryOperator BinaryOperatorsStack.top()
313 
314   // In a sequence of binary logical operators, if the new operator is different
315   // from the previous one, then the cognitive complexity is increased.
TraverseBinaryOperator(BinaryOperator * Op)316   bool TraverseBinaryOperator(BinaryOperator *Op) {
317     if (!Op || !Op->isLogicalOp())
318       return Base::TraverseBinaryOperator(Op);
319 
320     // Make sure that there is always at least one frame in the stack.
321     if (BinaryOperatorsStack.empty())
322       BinaryOperatorsStack.emplace();
323 
324     // If this is the first binary operator that we are processing, or the
325     // previous binary operator was different, there is an increment.
326     if (!CurrentBinaryOperator || Op->getOpcode() != CurrentBinaryOperator)
327       CC.account(Op->getOperatorLoc(), CurrentNestingLevel,
328                  CognitiveComplexity::Criteria::Increment);
329 
330     // We might encounter a function call, which starts a new sequence, thus
331     // we need to save the current previous binary operator.
332     const Optional<BinaryOperator::Opcode> BinOpCopy(CurrentBinaryOperator);
333 
334     // Record the operator that we are currently processing and traverse it.
335     CurrentBinaryOperator = Op->getOpcode();
336     bool ShouldContinue = Base::TraverseBinaryOperator(Op);
337 
338     // And restore the previous binary operator, which might be nonexistent.
339     CurrentBinaryOperator = BinOpCopy;
340 
341     return ShouldContinue;
342   }
343 
344   // It would make sense for the function call to start the new binary
345   // operator sequence, thus let's make sure that it creates a new stack frame.
TraverseCallExpr(CallExpr * Node)346   bool TraverseCallExpr(CallExpr *Node) {
347     // If we are not currently processing any binary operator sequence, then
348     // no Node-handling is needed.
349     if (!Node || BinaryOperatorsStack.empty() || !CurrentBinaryOperator)
350       return Base::TraverseCallExpr(Node);
351 
352     // Else, do add [uninitialized] frame to the stack, and traverse call.
353     BinaryOperatorsStack.emplace();
354     bool ShouldContinue = Base::TraverseCallExpr(Node);
355     // And remove the top frame.
356     BinaryOperatorsStack.pop();
357 
358     return ShouldContinue;
359   }
360 
361 #undef CurrentBinaryOperator
362 
TraverseStmt(Stmt * Node)363   bool TraverseStmt(Stmt *Node) {
364     if (!Node)
365       return Base::TraverseStmt(Node);
366 
367     // Three following switch()'es have huge duplication, but it is better to
368     // keep them separate, to simplify comparing them with the Specification.
369 
370     CognitiveComplexity::Criteria Reasons = CognitiveComplexity::Criteria::None;
371     SourceLocation Location = Node->getBeginLoc();
372 
373     // B1. Increments
374     // There is an increment for each of the following:
375     switch (Node->getStmtClass()) {
376     // if, else if, else are handled in TraverseIfStmt(),
377     // FIXME: "each method in a recursion cycle" Increment is not implemented.
378     case Stmt::ConditionalOperatorClass:
379     case Stmt::SwitchStmtClass:
380     case Stmt::ForStmtClass:
381     case Stmt::CXXForRangeStmtClass:
382     case Stmt::WhileStmtClass:
383     case Stmt::DoStmtClass:
384     case Stmt::CXXCatchStmtClass:
385     case Stmt::GotoStmtClass:
386     case Stmt::IndirectGotoStmtClass:
387       Reasons |= CognitiveComplexity::Criteria::Increment;
388       break;
389     default:
390       // break LABEL, continue LABEL increase cognitive complexity,
391       // but they are not supported in C++ or C.
392       // Regular break/continue do not increase cognitive complexity.
393       break;
394     }
395 
396     // B2. Nesting level
397     // The following structures increment the nesting level:
398     switch (Node->getStmtClass()) {
399     // if, else if, else are handled in TraverseIfStmt(),
400     // Nested methods and such are handled in TraverseDecl.
401     case Stmt::ConditionalOperatorClass:
402     case Stmt::SwitchStmtClass:
403     case Stmt::ForStmtClass:
404     case Stmt::CXXForRangeStmtClass:
405     case Stmt::WhileStmtClass:
406     case Stmt::DoStmtClass:
407     case Stmt::CXXCatchStmtClass:
408     case Stmt::LambdaExprClass:
409     case Stmt::StmtExprClass:
410       Reasons |= CognitiveComplexity::Criteria::IncrementNesting;
411       break;
412     default:
413       break;
414     }
415 
416     // B3. Nesting increments
417     // The following structures receive a nesting increment
418     // commensurate with their nested depth inside B2 structures:
419     switch (Node->getStmtClass()) {
420     // if, else if, else are handled in TraverseIfStmt().
421     case Stmt::ConditionalOperatorClass:
422     case Stmt::SwitchStmtClass:
423     case Stmt::ForStmtClass:
424     case Stmt::CXXForRangeStmtClass:
425     case Stmt::WhileStmtClass:
426     case Stmt::DoStmtClass:
427     case Stmt::CXXCatchStmtClass:
428       Reasons |= CognitiveComplexity::Criteria::PenalizeNesting;
429       break;
430     default:
431       break;
432     }
433 
434     if (Node->getStmtClass() == Stmt::ConditionalOperatorClass) {
435       // A little beautification.
436       // For conditional operator "cond ? true : false" point at the "?"
437       // symbol.
438       ConditionalOperator *COp = dyn_cast<ConditionalOperator>(Node);
439       Location = COp->getQuestionLoc();
440     }
441 
442     // If we have found any reasons, let's account it.
443     if (Reasons & CognitiveComplexity::Criteria::All)
444       CC.account(Location, CurrentNestingLevel, Reasons);
445 
446     // Did we decide that the nesting level should be increased?
447     if (!(Reasons & CognitiveComplexity::Criteria::IncrementNesting))
448       return Base::TraverseStmt(Node);
449 
450     return TraverseStmtWithIncreasedNestingLevel(Node);
451   }
452 
453   // The parameter MainAnalyzedFunction is needed to differentiate between the
454   // cases where TraverseDecl() is the entry point from
455   // FunctionCognitiveComplexityCheck::check() and the cases where it was called
456   // from the FunctionASTVisitor itself. Explanation: if we get a function
457   // definition (e.g. constructor, destructor, method), the Cognitive Complexity
458   // specification states that the Nesting level shall be increased. But if this
459   // function is the entry point, then the Nesting level should not be
460   // increased. Thus that parameter is there and is used to fall-through
461   // directly to traversing if this is the main function that is being analyzed.
TraverseDecl(Decl * Node,bool MainAnalyzedFunction=false)462   bool TraverseDecl(Decl *Node, bool MainAnalyzedFunction = false) {
463     if (!Node || MainAnalyzedFunction)
464       return Base::TraverseDecl(Node);
465 
466     // B2. Nesting level
467     // The following structures increment the nesting level:
468     switch (Node->getKind()) {
469     case Decl::Function:
470     case Decl::CXXMethod:
471     case Decl::CXXConstructor:
472     case Decl::CXXDestructor:
473     case Decl::Block:
474       break;
475     default:
476       // If this is something else, we use early return!
477       return Base::TraverseDecl(Node);
478       break;
479     }
480 
481     CC.account(Node->getBeginLoc(), CurrentNestingLevel,
482                CognitiveComplexity::Criteria::IncrementNesting);
483 
484     return TraverseDeclWithIncreasedNestingLevel(Node);
485   }
486 
487   CognitiveComplexity CC;
488 };
489 
490 } // namespace
491 
FunctionCognitiveComplexityCheck(StringRef Name,ClangTidyContext * Context)492 FunctionCognitiveComplexityCheck::FunctionCognitiveComplexityCheck(
493     StringRef Name, ClangTidyContext *Context)
494     : ClangTidyCheck(Name, Context),
495       Threshold(Options.get("Threshold", CognitiveComplexity::DefaultLimit)) {}
496 
storeOptions(ClangTidyOptions::OptionMap & Opts)497 void FunctionCognitiveComplexityCheck::storeOptions(
498     ClangTidyOptions::OptionMap &Opts) {
499   Options.store(Opts, "Threshold", Threshold);
500 }
501 
registerMatchers(MatchFinder * Finder)502 void FunctionCognitiveComplexityCheck::registerMatchers(MatchFinder *Finder) {
503   Finder->addMatcher(
504       functionDecl(isDefinition(),
505                    unless(anyOf(isDefaulted(), isDeleted(), isImplicit(),
506                                 isInstantiated(), isWeak())))
507           .bind("func"),
508       this);
509 }
510 
check(const MatchFinder::MatchResult & Result)511 void FunctionCognitiveComplexityCheck::check(
512     const MatchFinder::MatchResult &Result) {
513   const auto *Func = Result.Nodes.getNodeAs<FunctionDecl>("func");
514   assert(Func->hasBody() && "The matchers should only match the functions that "
515                             "have user-provided body.");
516 
517   FunctionASTVisitor Visitor;
518   Visitor.TraverseDecl(const_cast<FunctionDecl *>(Func), true);
519 
520   if (Visitor.CC.Total <= Threshold)
521     return;
522 
523   diag(Func->getLocation(),
524        "function %0 has cognitive complexity of %1 (threshold %2)")
525       << Func << Visitor.CC.Total << Threshold;
526 
527   // Output all the basic increments of complexity.
528   for (const auto &Detail : Visitor.CC.Details) {
529     unsigned MsgId;          // The id of the message to output.
530     unsigned short Increase; // How much of an increment?
531     std::tie(MsgId, Increase) = Detail.process();
532     assert(MsgId < Msgs.size() && "MsgId should always be valid");
533     // Increase, on the other hand, can be 0.
534 
535     diag(Detail.Loc, Msgs[MsgId], DiagnosticIDs::Note)
536         << (unsigned)Increase << (unsigned)Detail.Nesting << 1 + Detail.Nesting;
537   }
538 }
539 
540 } // namespace readability
541 } // namespace tidy
542 } // namespace clang
543